j30231's picture
Upload 59 files
0313279 verified
{
"metadata": {
"model_name": "llama-3.3-70b-instruct",
"ntrain": 0,
"ntest": -1,
"timestamp": "20241212-064359"
},
"subject": "high_school_statistics",
"category": "STEM",
"correct_rate": 68.05555555555556,
"evaluation_results": [
{
"question": "The weight of an aspirin tablet is 300 milligrams according to the bottle label. An FDA investigator weighs a simple random sample of seven tablets, obtains weights of 299, 300, 305, 302, 299, 301, and 303, and runs a hypothesis test of the manufacturer's claim. Which of the following gives the P-value of this test?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 49.53250193595886
},
{
"question": "The waiting times for a new roller coaster ride are normally distributed with a mean of 35 minutes and a standard deviation of 10 minutes. If there are 150,000 riders the first summer, which of the following is the shortest time interval associated with 100,000 riders?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 49.53339099884033
},
{
"question": "All of the following statements are true for all discrete random variables except for which one?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.533722162246704
},
{
"question": "Which of the following is a true statement about hypothesis testing?",
"model_answer": "A.",
"correct_answer": 3,
"is_correct": false,
"response_time": 49.533987045288086
},
{
"question": "An outlier is an observation that",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.53425312042236
},
{
"question": "The principal of a school is interested in estimating the average income per family of her students. She selects a random sample of students and collects information about their family income. A 95 percent confidence interval computed from this data for the mean income per family is ($35,095, $45,005). Which of the following provides the best interpretation of this confidence interval?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.53451108932495
},
{
"question": "Researchers are conducting an experiment using a significance level of 0.05. The null hypothesis is, in fact, false. If they modify their experiment to use twice as many experimental units for each treatment, which of the following would be true?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.53460502624512
},
{
"question": "The mean height of adult men is 70 inches, with a standard deviation of four inches. The mean height of adult women is 66 inches, with a standard deviation of three inches. Between a man with a height of 74 inches and a woman with a height of 70 inches, who is more unusually tall within his or her respective sex?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.534696102142334
},
{
"question": "Which of the following is not true about t-distributions?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 49.53478384017944
},
{
"question": "To study the effect of alcohol on reaction time, subjects were randomly selected and given three beers to consume. Their reaction time to a simple stimulus was measured before and after drinking the alcohol. Which of the following is a correct statement?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.53486895561218
},
{
"question": "Which of these statements correctly explains bias?",
"model_answer": "B.",
"correct_answer": 0,
"is_correct": false,
"response_time": 38.033722162246704
},
{
"question": "A company that produces facial tissues continually monitors tissue strength. If the mean strength from sample data drops below a specified level, the production process is halted and the machinery inspected. Which of the following would result from a Type I error?",
"model_answer": "D",
"correct_answer": 2,
"is_correct": false,
"response_time": 38.03383803367615
},
{
"question": "The longevity of people living in a certain locality has a standard deviation of 14 years. What is the mean longevity if 30% of the people live longer than 75 years? Assume a normal distribution for life spans.",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 38.033931016922
},
{
"question": "Changing from a 90% confidence interval estimate for a population proportion to a 99% confidence interval estimate, with all other things being equal,",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 38.03403306007385
},
{
"question": "Which of the following is a binomial random variable?",
"model_answer": "C",
"correct_answer": 3,
"is_correct": false,
"response_time": 38.0341260433197
},
{
"question": "If all the other variables remain constant, which of the following will increase the power of a hypothesis test? I.Increasing the sample size. II.Increasing the significance level. III.Increasing the probability of a Type II error.",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 38.0342161655426
},
{
"question": "Which of the following statements is (are) true? I. In order to use a χ2 procedure, the expected value for each cell of a one- or two-way table must be at least 5. II. In order to use χ2 procedures, you must have at least 2 degrees of freedom. III. In a 4 × 2 two-way table, the number of degrees of freedom is 3.",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 38.034306049346924
},
{
"question": "Suppose two events, E and F, have nonzero probabilities p and q, respectively. Which of the following is impossible?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 38.03440999984741
},
{
"question": "The probability that there will be an accident on Highway 48 each day depends on the weather. If the weather is dry that day, there is a 0.2% chance of an accident on Highway 48; if the weather is wet that day, there is a 1.0% chance of an accident. Today, the weather station announced that there is a 20% chance of the weather being wet. What is the probability that there will be an accident on Highway 48 today?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 38.03452515602112
},
{
"question": "The binomial distribution is an appropriate model for which of the following?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 38.03461694717407
},
{
"question": "Data were collected on two variables X and Y and a least squares regression line was fitted to the data. The estimated equation for this data is y = –2.29 + 1.70x. One point has x = 5, y = 6. What is the residual for this point?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 41.84061002731323
},
{
"question": "Which of these explains why t should be used instead of z for inference procedures for means.",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 41.84106492996216
},
{
"question": "Which of the following is least likely to reduce bias in a sample survey?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 41.841428995132446
},
{
"question": "For their first exam, students in an AP Statistics class studied an average of 4 hours with a standard deviation of 1 hour. Almost everyone did poorly on the exam, and so for the second exam every student studied 10 hours. What is the correlation between the numbers of hours students studied for each exam?",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 41.841776847839355
},
{
"question": "The appraised values of houses in a city have a mean of $125,000 with a standard deviation of $23,000. Because of a new teachers' contract, the school district needs an extra 10% in funds compared to the previous year. To raise this additional money, the city instructs the assessment office to raise all appraised house values by $5,000. What will be the new standard deviation of the appraised values of houses in the city?",
"model_answer": "A",
"correct_answer": 0,
"is_correct": true,
"response_time": 41.84212803840637
},
{
"question": "A large company has offices in two locations, one in New Jersey and one in Utah. The mean salary of office assistants in the New Jersey office is $28,500. The mean salary of office assistants in the Utah office is $22,500. The New Jersey office has 128 office assistants and the Utah office has 32 office assistants. What is the mean salary paid to the office assistants in this company?",
"model_answer": "D.",
"correct_answer": 3,
"is_correct": true,
"response_time": 41.84268498420715
},
{
"question": "Which of the following is a false statement about simple random samples?",
"model_answer": "C",
"correct_answer": 0,
"is_correct": false,
"response_time": 41.84280514717102
},
{
"question": "A telephone executive instructs an associate to contact 104 customers using their service to obtain their opinions in regard to an idea for a new pricing package. The associate notes the number of customers whose names begin with A and uses a random number table to pick four of these names. She then proceeds to use the same procedure for each letter of the alphabet and combines the 4 × 26 = 104 results into a group to be contacted. Which of the following is a correct conclusion?",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 41.8429000377655
},
{
"question": "A company has a choice of three investment schemes. Option I gives a sure $25,000 return on investment. Option II gives a 50% chance of returning $50,000 and a 50% chance of returning $10,000. Option III gives a 5% chance of returning $100,000 and a 95% chance of returning nothing. Which option should the company choose?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 41.8429970741272
},
{
"question": "A one-sided test of a hypothesis about a population mean, based on a sample of size 14, yields a P-value of 0.075. Which of the following best describes the range of tvalues that would have given this P-value?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 41.84308409690857
},
{
"question": "The president of an online music streaming service whose customers pay a fee wants to gather additional information about customers who have joined in the past 12 months. The company plans to send out an e-mail survey to a sample of current customers with a link that gives participants a month of streaming service for free once the survey has been completed. They know that musical tastes vary by geographical region. Which of the following sample plans would produce the most representative sample of its customers?",
"model_answer": "B.",
"correct_answer": 3,
"is_correct": false,
"response_time": 51.87674903869629
},
{
"question": "You need to construct a 94% confidence interval for a population proportion. What is the upper critical value of z to be used in constructing this interval?",
"model_answer": "B.",
"correct_answer": 3,
"is_correct": false,
"response_time": 51.87686014175415
},
{
"question": "A local school has seven math teachers and seven English teachers. When comparing their mean salaries, which of the following is most appropriate?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 51.87695503234863
},
{
"question": "A small kiosk at the Atlanta airport carries souvenirs in the price range of $3.99 to $29.99, with a mean price of $14.75. The airport authorities decide to increase the rent charged for a kiosk by 5 percent. To make up for the increased rent, the kiosk owner decides to increase the prices of all items by 50 cents. As a result, which of the following will happen?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 51.8770489692688
},
{
"question": "The director of a local food bank asks for data on all donations given during the month of November. Of the 100 checks received, the average donation is $155 with a standard deviation of $32. Which of the following is the most appropriate statement?",
"model_answer": "D",
"correct_answer": 0,
"is_correct": false,
"response_time": 51.87714195251465
},
{
"question": "Which of the following describe/s the central limit theorem? I. The mean of the sampling distribution of x-is the same as the mean of the population. II. The standard deviation of the sampling distribution of x-is the same as the standard deviation of x- divided by the square root of the sample size. III. If the sample size is large, the shape of the sampling distribution of x- is approximately normal.",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 51.87723207473755
},
{
"question": "A large city was interested in annexing part of the surrounding county. In a survey conducted by the local newspaper, 58 percent of respondents said they were against the annexation. During the actual vote, not all eligible voters voted, but 56 percent of the respondents voted against the annexation. Which of the following best describes the difference in the percentages obtained from the newspaper poll and the vote itself?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 51.87732195854187
},
{
"question": "After receiving several complaints from his customers about the store being closed on Sundays, a storekeeper decided to conduct a survey. He randomly selected 100 female customers and 120 male customers, and asked them, \"Are you interested in shopping at this store on Sundays?\" He counted the number of customers answering \"yes\" and constructed a 95 percent confidence interval for the difference by subtracting the proportions of female from the proportion of male customers in favor of shopping on Sundays. The resulting interval was (–0.23, –0.18). Which of the following is a correct interpretation of the interval?",
"model_answer": "B.",
"correct_answer": 0,
"is_correct": false,
"response_time": 51.87741208076477
},
{
"question": "Which of the following is the primary difference between an experiment and an observational study?",
"model_answer": "B",
"correct_answer": 0,
"is_correct": false,
"response_time": 51.87750482559204
},
{
"question": "Random variable X is normally distributed, with a mean of 25 and a standard deviation of 4. Which of the following is the approximate interquartile range for this distribution?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 51.87759494781494
},
{
"question": "Which of the following statements about any two events A and B is true?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 45.89702582359314
},
{
"question": "A company has 400 employees. Their mean income is $20,500, and the standard deviation of their incomes is $3,750. The distribution of incomes is normally distributed. How many of the 400 employees do you expect to have an income of between $13,000 and $28,000?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 45.89714169502258
},
{
"question": "As reported on CNN, in a May 1999 national poll 43% of high school students expressed fear about going to school. Which of the following best describes what is meant by the poll having a margin of error of 5%?",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 45.897241830825806
},
{
"question": "Suppose you wish to compare the AP Statistics exam results for the male and female students taking AP Statistics at your high school. Which is the most appropriate technique for gathering the needed data?",
"model_answer": "D",
"correct_answer": 0,
"is_correct": false,
"response_time": 45.89733576774597
},
{
"question": "In one study half of a class were instructed to watch exactly 1 hour of television per day, the other half were told to watch 5 hours per day, and then their class grades were compared. In a second study students in a class responded to a questionnaire asking about their television usage and their class grades.",
"model_answer": "D",
"correct_answer": 0,
"is_correct": false,
"response_time": 45.8974289894104
},
{
"question": "In a high school of 1650 students, 132 have personal investments in the stock market. To estimate the total stock investment by students in this school, two plans are proposed. Plan I would sample 30 students at random, find a confidence interval estimate of their average investment, and then multiply both ends of this interval by 1650 to get an interval estimate of the total investment. Plan II would sample 30 students at random from among the 132 who have investments in the market, find a confidence interval estimate of their average investment, and then multiply both ends of this interval by 132 to get an interval estimate of the total investment. Which is the better plan for estimating the total stock market investment by students in this school?",
"model_answer": "A.",
"correct_answer": 1,
"is_correct": false,
"response_time": 45.897521018981934
},
{
"question": "Sampling error occurs",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 45.89761686325073
},
{
"question": "The regression analysis of question 20 indicated that \"R-sq = 98.1%.\" Which of the following is (are) true? I. There is a strong positive linear relationship between the explanatory and response variables. II. There is a strong negative linear relationship between the explanatory and response variables. III. About 98% of the variation in the response variable can be explained by the regression on the explanatory variable.",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 45.89770770072937
},
{
"question": "In a clinic, 50 patients with sleep disorders are randomly assigned to one of two different groups. Patients in one group are given medication before bedtime. Patients in the other group are given blindfolds and played soft music at bedtime. Each patient is attached to a machine that records breathing patterns. From the patterns, it is possible to determine if the patient is awake or asleep. The data will be used to decide which method is more effective in helping patients with sleep disorders. Which of the following statements is correct in the context of this experiment?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 45.897799015045166
},
{
"question": "A study was conducted to test a new style of keyboard in preventing repetitive stress disorders. Volunteers who have had problems with such injuries were randomly assigned to use either a traditional keyboard or the new design. A significance test was conducted with the alternative hypothesis that a smaller proportion of those using the new keyboard will suffer injuries than those using the traditional keyboard. The resulting P-value was 0.07. Which is a correct interpretation of this P-value?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 45.897889852523804
},
{
"question": "A college admissions officer is interested in comparing the SAT math scores of high school applicants who have and have not taken AP Statistics. She randomly pulls the files of five applicants who took AP Statistics and five applicants who did not, and proceeds to run a t-test to compare the mean SAT math scores of the two groups. Which of the following is a necessary assumption?",
"model_answer": "C",
"correct_answer": 3,
"is_correct": false,
"response_time": 39.8782639503479
},
{
"question": "Given that P(E) = 0.32, P(F) = 0.15, and P(E ∩ F) = 0.048, which of the following is a correct conclusion?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 39.87837195396423
},
{
"question": "A medical research team tests for tumor reduction in a sample of patients using three different dosages of an experimental cancer drug. Which of the following is true?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 39.87847304344177
},
{
"question": "A department store at a large mall claims that over 60 percent of the mall’s visitors shop at that store. Let p = the proportion of the mall’s visitors who shop at the store. Which of the following pairs of hypotheses should be used to support this claim?",
"model_answer": "A",
"correct_answer": 0,
"is_correct": true,
"response_time": 39.87857007980347
},
{
"question": "Which of the following can affect the value of the correlation r?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 39.87866425514221
},
{
"question": "In general, how does tripling the sample size change the confidence interval size?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 39.87875699996948
},
{
"question": "Suppose the correlation between two variables is r = 0.19. What is the new correlation if 0.23 is added to all values of the x-variable, every value of the y-variable is doubled, and the two variables are interchanged?",
"model_answer": "D",
"correct_answer": 0,
"is_correct": false,
"response_time": 39.87884783744812
},
{
"question": "Students in AP Statistics class were timed in seconds while solving a series of mathematical brainteasers. One student's time had a standardized score of z = 2.40. If the times are all changed to minutes, what will then be the student's standardized score?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 39.87894010543823
},
{
"question": "An experiment was designed to test the effects of three different types of paint on the durability of wooden toys. Because boys and girls tend to play differently with toys, a randomly selected group of children was divided into two groups by sex. Which of the following statements about this experiment is true?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 39.87903189659119
},
{
"question": "Suppose there is a correlation of r = 0.9 between number of hours per day students study and GPAs. Which of the following is a reasonable conclusion?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 39.87911796569824
},
{
"question": "Estrella wants to become a paramedic and takes a screening exam. Scores on the exam have been approximately normally distributed over the years it has been given. The exam is normed with a mean of 80 and a standard deviation of 9. Only those who score in the top 15% on the test are invited back for further evaluation. Estrella received a 90 on the test. What was her percentile rank on the test, and did she qualify for further evaluation?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 46.614166021347046
},
{
"question": "To test whether extensive exercise lowers the resting heart rate, a study is performed by randomly selecting half of a group of volunteers to exercise 1 hour each morning, while the rest are instructed to perform no exercise. Is this study an experiment or an observational study?",
"model_answer": "A",
"correct_answer": 3,
"is_correct": false,
"response_time": 46.614280223846436
},
{
"question": "Both over-the-counter niacin and the prescription drug Lipitor are known to lower blood cholesterol levels. In one double-blind study Lipitor outperformed niacin. The 95% confidence interval estimate of the difference in mean cholesterol level lowering was (18, 41). Which of the following is a reasonable conclusion?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.6143741607666
},
{
"question": "Fifty oranges of one variety were selected at random and weighed. A 95 percent confidence interval computed from the sample weights to estimate the mean weight of oranges of this variety is (7.58, 8.72) ounces. Which of the following statements is true with respect to the confidence level used?",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 46.61446404457092
},
{
"question": "There are two games involving flipping a fair coin. In the first game you win a prize if you can throw between 45% and 55% heads. In the second game you win if you can throw more than 80% heads. For each game would you rather flip the coin 30 times or 300 times?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.61455512046814
},
{
"question": "A company is interested in comparing the mean sales revenue per salesperson at two different locations. The manager takes a random sample of 10 salespeople from each location independently and records the sales revenue generated by each person during the last four weeks. He decides to use a t-test to compare the mean sales revenue at the two locations. Which of the following assumptions is necessary for the validity of the t-test?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.614644050598145
},
{
"question": "Suppose you did 10 independent tests of the form H0: μ = 25 versus Ha: μ < 25, each at the α = 0.05 significance level. What is the probability of committing a Type I error and incorrectly rejecting a true H0 with at least one of the 10 tests?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 46.61474013328552
},
{
"question": "Suppose that 60% of a particular electronic part last over 3 years, while 70% last less than 6 years. Assuming a normal distribution, what are the mean and standard deviation with regard to length of life of these parts?",
"model_answer": "C",
"correct_answer": 1,
"is_correct": false,
"response_time": 46.61483311653137
},
{
"question": "A psychologist believes that positive rewards for proper behavior are more effective than punishment for bad behavior in promoting good behavior in children. A scale of \"proper behavior\" is developed. μ1= the \"proper behavior\" rating for children receiving positive rewards, and μ2= the \"proper behavior\" rating for children receiving punishment. If H0: μ1− μ2= 0, which of the following is the proper statement of HA?",
"model_answer": "C.",
"correct_answer": 0,
"is_correct": false,
"response_time": 46.614920139312744
},
{
"question": "A confidence interval estimate is determined from the monthly grocery expenditures in a random sample of n families. Which of the following will result in a smaller margin of error? I. A smaller confidence level. II. A smaller sample standard deviation. III. A smaller sample size",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 46.6150062084198
},
{
"question": "Which of the following is not important in the design of experiments?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 35.35115599632263
},
{
"question": "Which of the following is a correct statement?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 35.35128092765808
},
{
"question": "Define a new measurement as the difference between the 60th and 40th percentile scores in a population. This measurement will give information concerning",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 35.35137677192688
},
{
"question": "Which of the following is notrequired in a binomial setting?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 35.351475954055786
},
{
"question": "A publisher used standard boxes for shipping books. The mean weight of books packed per box is 25 pounds, with a standard deviation of two pounds. The mean weight of the boxes is one pound, with a standard deviation of 0.15 pounds. The mean weight of the packing material used per box is two pounds, with a standard deviation of 0.25 pounds. What is the standard deviation of the weights of the packed boxes?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 35.35157299041748
},
{
"question": "A group of scientists wanted to estimate the proportion of geese returning to the same site for the next breeding season. Suppose they decided to increase the sample size from 200 to 2,000. How will this affect the distribution of the sample proportion?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 35.35167574882507
},
{
"question": "A telephone survey of 400 registered voters showed that 256 had not yet made up their minds 1 month before the election. How sure can we be that between 60% and 68% of the electorate were still undecided at that time?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 35.35177493095398
},
{
"question": "Players in the National Football League weigh, on average, about 248 pounds with a standard deviation of about 47 pounds. If four players are to be selected at random, the expected value of the random variable W, the total combined weight of the four players, is 992 pounds. The standard deviation of Wis approximately",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 35.351871967315674
},
{
"question": "\"A hypothesis test yields a P-value of 0.20.\" Which of the following best describes what is meant by this statement?",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 35.35196495056152
},
{
"question": "Which of the following is not true with regard to contingency tables for chi-square tests for independence?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 35.35205388069153
},
{
"question": "The observed times (in minutes) it takes a runner to complete a marathon are normally distributed. The z-score for his running time this week is –2. Which one of the following statements is a correct interpretation of his z-score?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 51.54874587059021
},
{
"question": "The mean Law School Aptitude Test (LSAT) score for applicants to a particular law school is 650 with a standard deviation of 45. Suppose that only applicants with scores above 700 are considered. What percentage of the applicants considered have scores below 740? (Assume the scores are normally distributed.)",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 51.54888081550598
},
{
"question": "On the same test, Mary and Pam scored at the 64th and 56th percentiles, respectively. Which of the following is a true statement?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 51.548977851867676
},
{
"question": "A study looked at medical records of about 23,000 patients, mostly in Asia. They found that patients who drank at least three cups of green tea per day had a much lower incidence of depression. In an American newspaper article about this study, which of the following statements should not be made?",
"model_answer": "D.",
"correct_answer": 3,
"is_correct": true,
"response_time": 51.54907488822937
},
{
"question": "A researcher planning a survey of school principals in a particular state has lists of the school principals employed in each of the 125 school districts. The procedure is to obtain a random sample of principals from each of the districts rather than grouping all the lists together and obtaining a sample from the entire group. Which of the following is a correct conclusion?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 51.549171924591064
},
{
"question": "In an experiment, the control group should receive",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 51.54926896095276
},
{
"question": "Tina’s science fair project was to estimate the mean amount of chemicals in her city’s water supply. At first, she had decided to use a random sample of 15 observations. But her teacher asked her to take 35 observations. The mean and standard deviation from 35 observations turned out to be approximately the same as those from 15 observations. Is there any advantage in using 35 observations instead of 15 observations?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 51.54936909675598
},
{
"question": "The total cholesterol level in a large population of people is strongly skewed right with a mean of 210 mg/dL and a standard deviation of 15 mg/dL. If random samples of size 16 are repeatedly drawn from this population, which of the following appropriately describes the sampling distribution of these sample means?",
"model_answer": "D",
"correct_answer": 1,
"is_correct": false,
"response_time": 51.54947781562805
},
{
"question": "An experiment is conducted in which the response variable is the average gain in participants' performance in the long jump. A two-sample t-test with a 5% level of significance will be used to analyze the results. If all else is kept the same, which of the following descriptions of a possible change in procedure is true?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 51.5495719909668
},
{
"question": "An assembly line machine is supposed to turn out ball bearings with a diameter of 1.25 centimeters. Each morning the first 30 bearings produced are pulled and measured. If their mean diameter is under 1.23 centimeters or over 1.27 centimeters, the machinery is stopped and an engineer is called to make adjustments before production is resumed. The quality control procedure may be viewed as a hypothesis test with the null hypothesis H0: μ = 1.25 and the alternative hypothesis Ha: μ ≠ 1.25. The engineer is asked to make adjustments when the null hypothesis is rejected. In test terminology, what would a Type II error result in?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 51.5496609210968
},
{
"question": "We are interested in the proportion p of people who are unemployed in a large city. Eight percent of a simple random sample of 500 people are unemployed. What is the midpoint for a 95% confidence interval estimate of p?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 51.55061483383179
},
{
"question": "An insurance company wishes to study the number of years drivers in a large city go between automobile accidents. They plan to obtain and analyze the data from a sample of drivers. Which of the following is a true statement?",
"model_answer": "A.",
"correct_answer": 3,
"is_correct": false,
"response_time": 51.551050901412964
},
{
"question": "Which of the following is the central limit theorem?",
"model_answer": "A.",
"correct_answer": 3,
"is_correct": false,
"response_time": 51.55139493942261
},
{
"question": "A manufacturer of ready-bake cake mixes is interested in designing an experiment to test the effects of four different temperature levels (300, 325, 350, and 375F), two different types of pans (glass and metal), and three different types of ovens (gas, electric, and microwave) on the texture of its cakes, in all combinations. Which of the following below is the best description of the design of the necessary experiment?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 51.55173182487488
},
{
"question": "A study is made to determine whether more hours of academic studying leads to higher point scoring by basketball players. In surveying 50 basketball players, it is noted that the 25 who claim to study the most hours have a higher point average than the 25 who study less. Based on this study, the coach begins requiring the players to spend more time studying. Which of the following is a correct statement?",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 51.55207085609436
},
{
"question": "Biologists around the world have increased efforts at conservation. Monitoring wildlife populations is important so that appropriate management efforts can be implemented, but such monitoring is often difficult. One study found a cheap and easy way to estimate the number of nesting sites of terns (a type of seabird) by monitoring the number of calls heard per minute. More calls happen when there are more birds, as one would expect. In fact, it turned out that the number of calls explained 71% of the variation in the abundance of nests between breeding sites. Which of the following statements is correct about the correlation between the number of calls and the abundance of nests?",
"model_answer": "B.",
"correct_answer": 3,
"is_correct": false,
"response_time": 51.552536964416504
},
{
"question": "A company has 1000 employees evenly distributed throughout five assembly plants. A sample of 30 employees is to be chosen as follows. Each of the five managers will be asked to place the 200 time cards of their respective employees in a bag, shake them up, and randomly draw out six names. The six names from each plant will be put together to make up the sample. Will this method result in a simple random sample of the 1000 employees?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 51.5526659488678
},
{
"question": "A doctor hopes that a new surgery technique will shorten the recovery time compared to the standard technique. To test this, he designed an experiment in which patients who required this type of surgery were randomly assigned to the standard technique or the new technique. Then the mean recovery time for each treatment group was compared. Assuming conditions for inference were met, which analysis should be used?",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 51.55276298522949
},
{
"question": "A researcher plans a study to examine long-term confidence in the U.S. economy among the adult population. She obtains a simple random sample of 30 adults as they leave a Wall Street office building one weekday afternoon. All but two of the adults agree to participate in the survey. Which of the following conclusions is correct?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 51.55287289619446
},
{
"question": "To study the effect of music on piecework output at a clothing manufacturer, two experimental treatments are planned: day-long classical music for one group versus day-long light rock music for another. Which one of the following groups would serve best as a control for this study?",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 51.55296778678894
},
{
"question": "During the years 1886 through 2000 there were an average of 8.7 tropical cyclones per year, of which an average of 5.1 became hurricanes. Assuming that the probability of any cyclone becoming a hurricane is independent of what happens to any other cyclone, if there are five cyclones in one year, what is the probability that at least three become hurricanes?",
"model_answer": "C",
"correct_answer": 3,
"is_correct": false,
"response_time": 41.79450583457947
},
{
"question": "A chi-squared test of independence is to be performed on a 3 × 4 contingency table. How many degrees of freedom does this test have?",
"model_answer": "C.",
"correct_answer": 0,
"is_correct": false,
"response_time": 41.794872760772705
},
{
"question": "At a large hospital, the durations of emergency room visits, from check-in to discharge, are approximately normally distributed with a mean of 167 minutes and a standard deviation of 76 minutes. Which interval, to the nearest minute, contains the middle 80% of durations?",
"model_answer": "D",
"correct_answer": 2,
"is_correct": false,
"response_time": 41.79527497291565
},
{
"question": "The relation between studying time (in hours) and grade on a final exam (0-100) in a random sample of students in math class was found to be Grade = 50.25 + 10.2 (h) How will a student’s grade be affected if she studies for two hours?",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 41.79539680480957
},
{
"question": "A producer of skin care products has created a new formula for its cream to cure acne. To compare the effectiveness of the new cream to that of the old cream, it conducted a double-blind randomized experiment. Volunteers with acne tried the old formula on one side of their face and the new formula on the other, and which side got which formula was determined randomly. The response variable was the difference in the number of pimples (old formula - new formula). Which is the correct significance test to perform?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 41.7954957485199
},
{
"question": "A pharmaceutical company wants to test a new cholesterol-reducing drug against the previous drug. It does not anticipate much association between cholesterol level and gender, but it does anticipate an association between cholesterol level and the amount of exercise a person gets. For a randomized block design, it should:",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 41.79558992385864
},
{
"question": "An experiment is to be conducted to determine whether taking fish oil capsules or garlic capsules has more of an effect on cholesterol levels. In past studies it was noted that daily exercise intensity (low, moderate, high) is associated with cholesterol level, but average sleep length (< 5, 5 - 8, > 8 hours) is not associated with cholesterol level. This experiment should be done",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 41.79568266868591
},
{
"question": "A test for heartworm in dogs shows a positive result in 96% of dogs that actually have heartworm, and shows a negative result in 98% of dogs with no heartworm. If heartworm actually occurs in 10% of dogs, what is the probability that a randomly selected dog that tested positive for heartworm actually has heartworm?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 41.79577279090881
},
{
"question": "Suppose X and Y are random variables with μx = 32, σx = 5, μy = 44, and σy = 12. Given that X and Y are independent, what are the mean and standard deviation of the random variable X + Y?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 41.79586362838745
},
{
"question": "A high school sent a survey to a randomly selected sample of 75 of last year's graduating class. 27 of those selected did not return the survey. The best plan of action would be to:",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 41.79595494270325
},
{
"question": "Mr. Bee's statistics class had a standard deviation of 11.2 on a standardized test, while Mr. Em's class had a standard deviation of 5.6 on the same test. Which of the following is the most reasonable conclusion concerning the two classes' performance on the test?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 42.489845991134644
},
{
"question": "When a patient complains to the doctor about a certain set of symptoms, the doctor diagnoses the patient with Condition A 15% of the time. If a patient with these symptoms is diagnosed with Condition A, he or she is diagnosed with Condition B 70% of the time. A patient with these symptoms that is not diagnosed with Condition A is diagnosed with Condition B 10% of the time. What is the probability that a patient with this set of symptoms will be diagnosed with at least one of these conditions?",
"model_answer": "C",
"correct_answer": 0,
"is_correct": false,
"response_time": 42.489964962005615
},
{
"question": "A simple random sample is defined by",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 42.49006199836731
},
{
"question": "In one study on the effect that eating meat products has on weight level, an SRS of 500 subjects who admitted to eating meat at least once a day had their weights compared with those of an independent SRS of 500 people who claimed to be vegetarians. In a second study, an SRS of 500 subjects were served at least one meat meal per day for 6 months, while an independent SRS of 500 others were chosen to receive a strictly vegetarian diet for 6 months, with weights compared after 6 months.",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 42.49015688896179
},
{
"question": "Which of these is a correct description of the term?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 42.49025511741638
},
{
"question": "In the jury pool available for this week, 30 percent of potential jurors are women. A particular trial requires that, out of a jury of 12, at least three are women. If a jury of 12 is to be selected at random from the pool, what is the probability it meets the requirements of this trial?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 42.490352153778076
},
{
"question": "An employment placement agency specializes in placing workers in jobs suited for them. From past experience, the agency knows that 20% of all the workers it places will no longer be at the position in which they were placed after one year; however, only 5% of those remaining after the first year leave during the next year. At the start of a year an employer hires 100 workers using this agency, then at the start of the next year the employer hires 100 more. How many of these 200 workers are expected to be on the job at the end of the second year?",
"model_answer": "B.",
"correct_answer": 3,
"is_correct": false,
"response_time": 42.49044990539551
},
{
"question": "A newspaper reporter examined police reports of accidents during the past 12 months to collect data about the speed of a car and its stopping distance. The reporter then constructed a scatterplot and computed a correlation coefficient to show the relation between a car’s speed and its stopping distance. This is an example of",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 42.49054789543152
},
{
"question": "In which of the following situations is a binomial model not an appropriate model to describe the outcome?",
"model_answer": "D",
"correct_answer": 1,
"is_correct": false,
"response_time": 42.49065113067627
},
{
"question": "Two possible wordings for a questionnaire on a proposed school budget increase are as follows:",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 42.490745067596436
},
{
"question": "Company I manufactures demolition fuses that burn an average of 50 minutes with a standard deviation of 10 minutes, while company II advertises fuses that burn an average of 55 minutes with a standard deviation of 5 minutes. Which company's fuse is more likely to last at least 1 hour? Assume normal distributions of fuse times.",
"model_answer": "A",
"correct_answer": 2,
"is_correct": false,
"response_time": 46.20134210586548
},
{
"question": "In a random sample of Toyota car owners, 83 out of 112 said they were satisfied with the Toyota front-wheel drive, while in a similar survey of Subaru owners, 76 out of 81 said they were satisfied with the Subaru four-wheel drive. A 90% confidence interval estimate for the difference in proportions between Toyota and Subaru car owners who are satisfied with their drive systems is reported to be -0.197 ± 0.081. Which is a proper conclusion?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.201454162597656
},
{
"question": "Which of the following statements about the correlation coefficient is true?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 46.201555013656616
},
{
"question": "A school board of a large school district is proposing a new dress code for students. Some students feel that this dress code unfairly targets female students. To see if there is a difference between boys and girls in their opposition to the new dress code, they conduct a poll of 60 randomly selected male and 70 randomly selected female high school students in the district. They find that 66 females oppose the dress code and 50 males oppose the dress code. Which of the following explains why a two-proportion z-test is not appropriate?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 46.2016499042511
},
{
"question": "A soft drink dispenser can be adjusted to deliver any fixed number of ounces. If the machine is operating with a standard deviation in delivery equal to 0.3 ounce, what should be the mean setting so that a 12-ounce cup will overflow less than 1% of the time? Assume a normal distribution for ounces delivered.",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 46.201744079589844
},
{
"question": "The average number of calories in Yum-Yum Good candy bars is 210, with a standard deviation of 10. If the number of calories per candy bar is normally distributed, what percent of candy bars contain more than 225 calories?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.20183610916138
},
{
"question": "The mean daily demand for bread at a popular bakery is 2,500 loaves, with a standard deviation of 225 loaves. Every morning the bakery bakes 3,000 loaves. What is the probability that today it will run out of bread? Assume that the mean daily demand for bread at this bakery is normally distributed.",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 46.20192909240723
},
{
"question": "Two dice are rolled simultaneously. If both dice show 6, then the player wins $20; otherwise the player loses the game. It costs $2.00 to play the game. What is the expected gain or loss per game?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.20202112197876
},
{
"question": "Suppose you toss a fair die three times and it comes up an even number each time. Which of the following is a true statement?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.2021119594574
},
{
"question": "Taxicabs in a metropolitan area are driven an average of 75,000 miles per year with a standard deviation of 12,000 miles. What is the probability that a randomly selected cab has been driven less than 100,000 miles if it is known that it has been driven over 80,000 miles? Assume a normal distribution of miles per year among cabs.",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 46.2022020816803
},
{
"question": "The registrar’s office at a university has noticed that a large number of students fail to report a change of address. The registrar decides to take a random sample of 150 students from the current directory of students and determine the number of students with the correct addresses on record. He then uses this information to construct a 95 percent confidence interval. Which of the following statements must be true?",
"model_answer": "C",
"correct_answer": 3,
"is_correct": false,
"response_time": 54.763434171676636
},
{
"question": "A botanist is interested in testing H0: μ = 3.5 cm versus Ha: μ > 3.5, where μ = the mean petal length of one variety of flowers. A random sample of 50 petals gives significant results at a 5 percent level of significance. Which of the following statements about the confidence interval to estimate the mean petal length is true?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 54.7640221118927
},
{
"question": "A dentist has noticed that about two children in every seven whom he sees professionally develop cavities before they turn 10 years old. Last week he examined the teeth of five unrelated children younger than 10. Let X be the number of children who develop cavities before turning 10. Which of the following gives the probability that at least one will develop a cavity before turning 10?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 54.764461040496826
},
{
"question": "Which of the following is NOT true of the χ2 probability distribution function?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 54.76493501663208
},
{
"question": "The relation between the selling price of a car (in $1,000) and its age (in years) is estimated from a random sample of cars of a specific model. The relation is given by the following formula: Selling price = 15.9 – 0.983 (age) Which of the following can we conclude from this equation?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 54.765366077423096
},
{
"question": "Consider a hypothesis test with H0 : μ = 70 and Ha : μ < 70. Which of the following choices of significance level and sample size results in the greatest power of the test when μ = 65?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 54.76549410820007
},
{
"question": "A farmer who raises hens for egg production wants his eggs to have a mean mass of 56 grams. He is considering the purchase of a different type of hen, so he took a random sample of 18 eggs laid by this type of hen. The distribution of the masses is symmetric and mound-shaped with a mean of 54.1 grams and no outliers. The farmer conducted a t-test to see if there is evidence that the eggs from these hens have a mean mass that is different from 56 g and got a test statistic of t= -1.973. If he uses a 5% significance level, which is the correct conclusion and reason?",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 54.76559281349182
},
{
"question": "A school committee member is lobbying for an increase in the gasoline tax to support the county school system. The local newspaper conducted a survey of county residents to assess their support for such an increase. What is the population of interest here?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 54.76568818092346
},
{
"question": "To survey the opinions of the students at your high school, a researcher plans to select every twenty-fifth student entering the school in the morning. Assuming there are no absences, will this result in a simple random sample of students attending your school?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 54.765783071517944
},
{
"question": "Which of the following is a true statement?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 54.76589798927307
},
{
"question": "An automobile service station performs oil changes and tire replacements, as well as other services. Sixty percent of its customers request an oil change, 30 percent request tire replacements, and 10 percent request both. A customer requests an oil change. What is the probability this customer does not request tire replacements?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.73254323005676
},
{
"question": "Which of the following statements is false?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.733094215393066
},
{
"question": "A kidney dialysis center periodically checks a sample of its equipment and performs a major recalibration if readings are sufficiently off target. Similarly, a fabric factory periodically checks the sizes of towels coming off an assembly line and halts production if measurements are sufficiently off target. In both situations, we have the null hypothesis that the equipment is performing satisfactorily. For each situation, which is the more serious concern, a Type I or Type II error?",
"model_answer": "A",
"correct_answer": 2,
"is_correct": false,
"response_time": 49.73413920402527
},
{
"question": "A company with offices in five different countries is interested in estimating the proportion of its employees in favor of banning smoking on the office premises. It is known that the views of people from different countries on issues like smoking tend to vary due to the influence of different local social structures. Which of the following is an appropriate sampling technique to use in this situation, and why?",
"model_answer": "B.",
"correct_answer": 0,
"is_correct": false,
"response_time": 49.73451519012451
},
{
"question": "Semir rolls a six-sided die every morning to determine what he will have for breakfast. If he rolls a 1 or 2, he takes time to cook himself a big breakfast. If he rolls a 3 or larger he grabs a quick lighter breakfast. When he cooks himself a big breakfast, there is a 15% chance he will be late for school. If he has a lighter breakfast, there is a 6% chance he will be late for school. What is the probability Semir will be on time for school any given day?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.73487210273743
},
{
"question": "A teacher's union and a school district are negotiating salaries for the coming year. The teachers want more money, and the district, claiming, as always, budget constraints, wants to pay as little as possible. The district, like most, has a large number of moderately paid teachers and a few highly paid administrators. The salaries of all teachers and administrators are included in trying to figure out, on average, how much the professional staff currently earn. Which of the following would the teachers' union be most likely to quote during negotiations?",
"model_answer": "A.",
"correct_answer": 3,
"is_correct": false,
"response_time": 49.735443115234375
},
{
"question": "The Hardcore Construction Company has two offices, one in Atlanta and one in New Orleans. Fifteen engineers work in the Atlanta office, and 14 engineers work in the New Orleans office. The business manager decided to use a 2-sample t-test to compare the mean salaries of engineers in the two offices. Because there were only 15 engineers in one office and 14 engineers in the other, he used the salaries of all the engineers in the computation. Is the 2-sample t-test an appropriate inferential technique in this situation?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.73557114601135
},
{
"question": "For the regression line, which of the following statements about residuals is true?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 49.73566818237305
},
{
"question": "A reading specialist in a large public school system believes that the more time students spend reading, the better they will do in school. She plans a middle school experiment in which an SRS of 30 eighth graders will be assigned four extra hours of reading per week, an SRS of 30 seventh graders will be assigned two extra hours of reading per week, and an SRS of 30 sixth graders with no extra assigned reading will be a control group. After one school year, the mean GPAs from each group will be compared. Is this a good experimental design?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.7357611656189
},
{
"question": "What is a sampling distribution?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 49.73584818840027
},
{
"question": "A farmer wants to know whether a new fertilizer has increased the mean weight of his apples. With the old fertilizer, the mean weight was 4.0 ounces per apple. The farmer decides to test H0: μ = 4.0 ounces versus Ha : μ > 4.0 ounces, at a 5 percent level of significance, where μ = the mean weight of apples using the new fertilizer. The weights of apples are approximately normally distributed. The farmer takes a random sample of 16 apples and computes a mean of 4.3 ounces and a standard deviation of 0.6 ounces. Which of the following gives the p-value for this test?",
"model_answer": "A",
"correct_answer": 2,
"is_correct": false,
"response_time": 47.124027967453
},
{
"question": "In a study on the effect of music on worker productivity, employees were told that a different genre of background music would be played each day and the corresponding production outputs noted. Every change in music resulted in an increase in production. This is an example of",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 47.124717712402344
},
{
"question": "In a clinical trial, 30 sickle cell anemia patients are randomly assigned to two groups. One group receives the currently marketed medicine, and the other group receives an experimental medicine. Each week, patients report to the clinic where blood tests are conducted. The lab technician is unaware of the kind of medicine the patient is taking. This design can be described as",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 47.1251859664917
},
{
"question": "Suppose that the weights of trucks traveling on the interstate highway system are normally distributed. If 70% of the trucks weigh more than 12,000 pounds and 80% weigh more than 10,000 pounds, what are the mean and standard deviation for the weights of trucks traveling on the interstate system?",
"model_answer": "A.",
"correct_answer": 2,
"is_correct": false,
"response_time": 47.125612020492554
},
{
"question": "An insurance agent is successful in selling a life insurance policy to 20 percent of the customers he contacts. He decides to construct a simulation to estimate the mean number of customers he needs to contact before being able to sell a policy. Which of the following schemes should he use to do the simulation?",
"model_answer": "C",
"correct_answer": 0,
"is_correct": false,
"response_time": 47.12611198425293
},
{
"question": "The midterm scores for a statistics course were approximately normally distributed with a mean of 52 points and a standard deviation of 4 points. The final exam scores were approximately normally distributed with a mean of 112 points and a standard deviation of 10 points. One student had a score of 58 points on the midterm. If she had the same standardized score (z-score) on the final exam, what must her score have been?",
"model_answer": "C",
"correct_answer": 3,
"is_correct": false,
"response_time": 47.12740397453308
},
{
"question": "The sampling distribution of the sample mean is close to the normal distribution",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 47.127521991729736
},
{
"question": "Suppose H0: p = 0.6, and the power of the test for Ha: p = 0.7 is 0.8. Which of the following is a valid conclusion?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 47.127618074417114
},
{
"question": "In one metropolitan region, technical writers have an annual salary that is approximately normally distributed with a mean of $55,800. The first quartile of salaries is $48,815. What is the standard deviation?",
"model_answer": "C",
"correct_answer": 1,
"is_correct": false,
"response_time": 47.127710819244385
},
{
"question": "The amount of rainfall per month in a certain city is approximately normally distributed, with a mean of six inches and a standard deviation of 1.6 inches. Which of the following is the highest amount of rainfall, in inches, this city could have this month for the month to be among the 10percent driest months the city has seen?",
"model_answer": "B",
"correct_answer": 2,
"is_correct": false,
"response_time": 47.12780284881592
},
{
"question": "Which of the following is most useful in establishing cause-and-effect relationships?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 42.041335105895996
},
{
"question": "A sports talk show asks people to call in and give their opinion of the officiating in the local basketball team's most recent loss. What will most likely be the typical reaction?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 42.04173994064331
},
{
"question": "Alfred and Ben don't know each other but are each considering asking the lovely Charlene to the school prom. The probability that at least one of them will ask her is 0.72. The probability that they both ask her is 0.18. The probability that Alfred asks her is 0.6. What is the probability that Ben asks Charlene to the prom?",
"model_answer": "C",
"correct_answer": 1,
"is_correct": false,
"response_time": 42.04226207733154
},
{
"question": "A random sample of 25 men and a separate random sample of 25 women are selected to answer questions about attitudes toward abortion. The answers were categorized as \"pro-life\" or \"pro-choice.\" Which of the following is the proper null hypothesis for this situation?",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 42.04285216331482
},
{
"question": "A 2008 survey of 500 households concluded that 82% of the population uses grocery coupons. Which of the following best describes what is meant by the poll having a margin of error of 3%?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 42.04297208786011
},
{
"question": "A hypothesis test is set up so that P(rejecting H0 when H0 is true) = 0.05 and P(failing to reject H0 when H0 is false) = 0.26. What is the power of the test?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 42.0430691242218
},
{
"question": "For a class project, Charlotte recorded the heights of all 28 students in her class and calculated several statistics. She then realized she made an error recording the height of the tallest person in the class. She correctly had him listed as the tallest, but needed to add two inches to his recorded height to correct it. Which of these measures of spread must remain unchanged?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 42.04316306114197
},
{
"question": "The main purpose of blocking in an experiment is to:",
"model_answer": "B.",
"correct_answer": 2,
"is_correct": false,
"response_time": 42.043253898620605
},
{
"question": "A manufacturer of motor oil is interested in testing the effects of a newly developed additive on the lifespan of an engine. Twenty-five different engine types are selected at random and each one is tested using oil with the additive and oil without the additive. What type of analysis will yield the most useful information?",
"model_answer": "B.",
"correct_answer": 1,
"is_correct": true,
"response_time": 42.043344020843506
},
{
"question": "To determine the average cost of running for a congressional seat, a simple random sample of 50 politicians is chosen and the politicians' records examined. The cost figures show a mean of $125,000 with a standard deviation of $32,000. Which of the following is the best interpretation of a 90% confidence interval estimate for the average cost of running for office?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 42.04343318939209
},
{
"question": "A filling machine puts an average of four ounces of coffee in jars, with a standard deviation of 0.25 ounces. Forty jars filled by this machine are selected at random. What is the probability that the mean amount per jar filled in the sampled jars is less than 3.9 ounces?",
"model_answer": "B",
"correct_answer": 0,
"is_correct": false,
"response_time": 39.63683795928955
},
{
"question": "A town has one high school, which buses students from urban, suburban, and rural communities. Which of the following samples is recommended in studying attitudes toward tracking of students in honors, regular, and below-grade classes?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 39.63696908950806
},
{
"question": "A shipment of resistors have an average resistance of 200 ohms with a standard deviation of 5 ohms, and the resistances are normally distributed. Suppose a randomly chosen resistor has a resistance under 194 ohms. What is the probability that its resistance is greater than 188 ohms?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 39.63707208633423
},
{
"question": "A major polling organization wants to predict the outcome of an upcoming national election (in terms of the proportion of voters who will vote for each candidate). They intend to use a 95% confidence interval with margin of error of no more than 2.5%. What is the minimum sample size needed to accomplish this goal?",
"model_answer": "A.",
"correct_answer": 2,
"is_correct": false,
"response_time": 39.637173891067505
},
{
"question": "Given that the sample has a standard deviation of zero, which of the following is a true statement?",
"model_answer": "A.",
"correct_answer": 1,
"is_correct": false,
"response_time": 39.6372709274292
},
{
"question": "The number of customers served per day by a large department store is normally distributed, with a mean of 3,250 customers and a standard deviation of 320. Find the range of customers served on the middle 50 percent of days.",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 39.63736581802368
},
{
"question": "Suppose that 54% of the graduates from your high school go on to 4-year colleges, 20% go on to 2-year colleges, 19% find employment, and the remaining 7% search for a job. If a randomly selected student is not going on to a 2-year college, what is the probability she will be going on to a 4-year college?",
"model_answer": "C",
"correct_answer": 3,
"is_correct": false,
"response_time": 39.63746094703674
},
{
"question": "The Department of Health plans to test the lead level in a specific park. Because a high lead level is harmful to children, the park will be closed if the lead level exceeds the allowed limit. The department randomly selects several locations in the park, gets soil samples from those locations, and tests the samples for their lead levels. Which of the following decisions would result from the type I error?",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 39.63755702972412
},
{
"question": "For a class project, a student wants to see if boys and girls at their large high school differ in the number of contacts they have stored in their phone. The student conducts a survey of 50 randomly sampled boys and 40 randomly selected girls, and asks them to report the number of contacts. Which of the following is true about this situation?",
"model_answer": "A.",
"correct_answer": 3,
"is_correct": false,
"response_time": 39.637651205062866
},
{
"question": "The probability is 0.2 that a value selected at random from a normal distribution with mean 600 and standard deviation 15 will be above what number?",
"model_answer": "D",
"correct_answer": 2,
"is_correct": false,
"response_time": 39.63774394989014
},
{
"question": "In a group of 10 scores, the largest score is increased by 40 points. What will happen to the mean?",
"model_answer": "D",
"correct_answer": 1,
"is_correct": false,
"response_time": 46.739802837371826
},
{
"question": "The distribution of salaries of a county school system with 4,752 employees is known to be right skewed, with the superintendent’s salary an outlier on the higher side. A random sample of 20 employees was taken and their salaries recorded. A 95 percent t-confidence interval for the mean salary of the county school system employees is ($15,360, $32,470). The t-confidence interval is not appropriate in this situation because",
"model_answer": "B.",
"correct_answer": 3,
"is_correct": false,
"response_time": 46.74146485328674
},
{
"question": "Assume that the masses of chicken eggs are normally distributed with a mean of 45 g and a standard deviation of 4 g. What mass of egg would be the 25th percentile of the masses of all the eggs?",
"model_answer": "C",
"correct_answer": 1,
"is_correct": false,
"response_time": 46.74158692359924
},
{
"question": "A recent poll reported that 43% of Americans approve of the job the president is doing, with a margin of sampling error of ±3.2% at a 95% level of confidence. Which of these correctly interprets that margin of error?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.741679668426514
},
{
"question": "What is the probability of a Type II error when a hypothesis test is being conducted at the 10% significance level (α = 0.10)?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.74177289009094
},
{
"question": "In comparing the life expectancies of two models of refrigerators, the average years before complete breakdown of 10 model A refrigerators is compared with that of 15 model B refrigerators. The 90% confidence interval estimate of the difference is (6, 12). Which of the following is the most reasonable conclusion?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 46.741862773895264
},
{
"question": "A medicine is known to produce side effects in one in five patients taking it. Suppose a doctor prescribes the medicine to four unrelated patients. What is the probability that none of the patients will develop side effects?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 46.74195194244385
},
{
"question": "Which of the following is notan advantage of stratified random sampling over simple random sampling?",
"model_answer": "B",
"correct_answer": 0,
"is_correct": false,
"response_time": 46.74204182624817
},
{
"question": "In the casino game of roulette, there are 38 slots for a ball to drop into when it is rolled around the rim of a revolving wheel: 18 red, 18 black, and 2 green. What is the probability that the first time a ball drops into the red slot is on the 8th trial (in other words, suppose you are betting on red every time-what is the probability of losing 7 straight times before you win the first time)?",
"model_answer": "A",
"correct_answer": 2,
"is_correct": false,
"response_time": 46.74212980270386
},
{
"question": "A talk show host recently reported that in response to his on-air question, 82% of the more than 2500 e-mail messages received through his publicized address supported the death penalty for anyone convicted of selling drugs to children. What does this show?",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 46.74221897125244
},
{
"question": "To determine the average number of children living in single-family homes, a researcher picks a simple random sample of 50 such homes. However, even after one follow-up visit the interviewer is unable to make contact with anyone in 8 of these homes. Concerned about nonresponse bias, the researcher picks another simple random sample and instructs the interviewer to keep trying until contact is made with someone in a total of 50 homes. The average number of children is determined to be 1.73. Is this estimate probably too low or too high?",
"model_answer": "A.",
"correct_answer": 2,
"is_correct": false,
"response_time": 36.81667900085449
},
{
"question": "If all the values of a data set are the same, all of the following must equal zero except for which one?",
"model_answer": "A",
"correct_answer": 0,
"is_correct": true,
"response_time": 36.81710505485535
},
{
"question": "A university sent out a survey to a random sample of 120 recent graduates to see how those graduates feel about the education they received. Thirty-two of the graduates did not respond to the survey. Which of these would be the best way to proceed?",
"model_answer": "A.",
"correct_answer": 2,
"is_correct": false,
"response_time": 36.81795692443848
},
{
"question": "Given the probabilities P(A) = 0.3 and P(B) = 0.2, what is the probability of the union P(A ∪ B) if A and B are mutually exclusive? If A and B are independent? If B is a subset of A?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 36.81828212738037
},
{
"question": "Which of the following is true about any discrete probability distribution of a random variable X?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 36.81856322288513
},
{
"question": "Which among the following would result in the narrowest confidence interval?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 36.8188271522522
},
{
"question": "The correlation between height in inches and weight in pounds for a particular class is 0.65. If the heights are converted from inches to centimeters, what will the correlation be? (1 in. = 2.54 cm)",
"model_answer": "D.",
"correct_answer": 3,
"is_correct": true,
"response_time": 36.81908893585205
},
{
"question": "The number of days it takes to build a new house has a variance of 386. A sample of 40 new homes shows an average building time of 83 days. With what confidence can we assert that the average building time for a new house is between 80 and 90 days?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 36.81935119628906
},
{
"question": "A significance test of the hypothesis H0: p= 0.3 against the alternative HA: p> 0.3 found a value of = 0.35 for a random sample of size 95. What is the P-value of this test?",
"model_answer": "B",
"correct_answer": 1,
"is_correct": true,
"response_time": 36.81961393356323
},
{
"question": "Two events A and B each have a nonzero probability. If A and B are independent, which of the following statements is true?",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 36.81986904144287
},
{
"question": "A teacher believes that giving her students a practice quiz every week will motivate them to study harder, leading to a greater overall understanding of the course material. She tries this technique for a year, and everyone in the class achieves a grade of at least C. Is this an experiment or an observational study?",
"model_answer": "A.",
"correct_answer": 0,
"is_correct": true,
"response_time": 43.17022109031677
},
{
"question": "Which of these is the best description of a P-value?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 43.17076110839844
},
{
"question": "The financial aid office at a state university conducts a study to determine the total student costs per semester. All students are charged $4500 for tuition. The mean cost for books is $350 with a standard deviation of $65. The mean outlay for room and board is $2800 with a standard deviation of $380. The mean personal expenditure is $675 with a standard deviation of $125. Assuming independence among categories, what is the standard deviation of the total student costs?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 43.17118811607361
},
{
"question": "Self-efficacy (the belief that one has control over one's situation) as it related to job satisfaction was studied. When a group of teachers rated their ability to control their situation and their satisfaction with their job, the two variables had a correlation of 0.30. Which statement follows from this correlation?",
"model_answer": "A",
"correct_answer": 3,
"is_correct": false,
"response_time": 43.17179608345032
},
{
"question": "Suppose X and Y are random variables with E(X) = 312, var(X) = 6, E(X) = 307, and var(Y) = 8. What are the expected value and variance of the random variable X + Y?",
"model_answer": "C",
"correct_answer": 3,
"is_correct": false,
"response_time": 43.1720027923584
},
{
"question": "Consider the two sets X = {10, 30, 45, 50, 55, 70, 90} and Y = {10, 30, 35, 50, 65, 70, 90}. Which of the following is false?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 43.17209815979004
},
{
"question": "Which of the following is a true statement?",
"model_answer": "B",
"correct_answer": 3,
"is_correct": false,
"response_time": 43.17218995094299
},
{
"question": "A researcher is hoping to find a predictive linear relationship between the explanatory and response variables in her study. Accordingly, as part of her analysis she plans to generate a 95% confidence interval for the slope of the regression line for the two variables. The interval is determined to be (0.45, 0.80). Which of the following is (are) true? (Assume conditions for inference are met.) I. She has good evidence of a linear relationship between the variables. II. It is likely that there is a non-zero correlation (r) between the two variables. III. It is likely that the true slope of the regression line is 0.",
"model_answer": "A",
"correct_answer": 0,
"is_correct": true,
"response_time": 43.172279834747314
},
{
"question": "A student organization at a university is interested in estimating the proportion of students in favor of showing movies biweekly instead of monthly. How many students should be sampled to get a 90 percent confidence interval with a width of at most 0.08?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 43.172369956970215
},
{
"question": "A correlation of 0.6 indicates that the percentage of variation in y that is explained by the variation in x is how many times the percentage indicated by a correlation of 0.3?",
"model_answer": "C",
"correct_answer": 2,
"is_correct": true,
"response_time": 43.17245817184448
},
{
"question": "For which of the following is it appropriate to use a census?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 29.069600820541382
},
{
"question": "Which of the following is the best description of the power of a significance test?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 29.069722890853882
},
{
"question": "A drug company will conduct a randomized controlled study on the effectiveness of a new heart disease medication called Heartaid. Heartaid is more expensive than the currently used medication. The analysis will include a significance test with H0: Heartaid and the current medication are equally effective at preventing heart disease and HA: Heartaid is more effective than the current medication at preventing heart disease. Which of these would be a potential consequence of a Type II error?",
"model_answer": "C.",
"correct_answer": 2,
"is_correct": true,
"response_time": 29.06981897354126
},
{
"question": "Two classes take the same exam. Suppose a certain score is at the 40th percentile for the first class and at the 80th percentile for the second class. Which of the following is the most reasonable conclusion?",
"model_answer": "B",
"correct_answer": 0,
"is_correct": false,
"response_time": 29.069916009902954
},
{
"question": "The mean thrust of a certain model jet engine is 9500 pounds. Concerned that a production process change might have lowered the thrust, an inspector tests a sample of units, calculating a mean of 9350 pounds with a z-score of -2.46 and a P-value of 0.0069. Which of the following is the most reasonable conclusion?",
"model_answer": "D",
"correct_answer": 3,
"is_correct": true,
"response_time": 29.07000994682312
},
{
"question": "When the point (15,2) is included, the slope of regression line (y= a+ bx) is b= -0.54. The correlation is r= -0.82. When the point is removed, the new slope is -1.04 and the new correlation coefficient is -0.95. What name is given to a point whose removal has this kind of effect on statistical calculations?",
"model_answer": "D.",
"correct_answer": 3,
"is_correct": true,
"response_time": 29.070103883743286
}
]
}