From 3670219a8f85f90714d728af33a7ab0562def4d6 Mon Sep 17 00:00:00 2001 From: Jake Poznanski Date: Fri, 28 Feb 2025 08:54:47 -0800 Subject: [PATCH] commits --- .../chatgpt/discoverworld_crazy_table4_1.md | 50 + .../sample_data/chatgpt/lincoln_letter_1.md | 15 + .../bench/sample_data/chatgpt/mattsnotes_1.md | 24 + .../chatgpt/multi_column_miss_1.md | 28 + .../bench/sample_data/chatgpt/olmo2-pg4_1.md | 24 + .../chatgpt/openstax_caculus_pg_273_1.md | 57 + .../chatgpt45/discoverworld_crazy_table4_1.md | 3 + .../sample_data/chatgpt45/lincoln_letter_1.md | 11 + .../sample_data/chatgpt45/mattsnotes_1.md | 23 + .../chatgpt45/multi_column_miss_1.md | 12 + .../sample_data/chatgpt45/olmo2-pg4_1.md | 13 + .../chatgpt45/openstax_caculus_pg_273_1.md | 55 + .../discoverworld_crazy_table4_1.md} | 0 .../sample_data/gotocr/lincoln_letter_1.md | 11 + .../bench/sample_data/gotocr/mattsnotes_1.md | 1 + .../multi_column_miss_1.md} | 0 .../bench/sample_data/gotocr/olmo2-pg4_1.md | 89 ++ .../gotocr/openstax_caculus_pg_273_1.md | 1045 +++++++++++++++++ ...le4.md => discoverworld_crazy_table4_1.md} | 0 .../marker/discoverworld_crazy_table4_2.md | 63 + .../marker/discoverworld_crazy_table4_3.md | 63 + .../sample_data/marker/lincoln_letter_1.md | 3 + .../bench/sample_data/marker/mattsnotes_1.md | 5 + ..._column_miss.md => multi_column_miss_1.md} | 0 .../sample_data/marker/multi_column_miss_2.md | 19 + .../sample_data/marker/multi_column_miss_3.md | 21 + .../bench/sample_data/marker/olmo2-pg4_1.md | 25 + .../marker/openstax_caculus_pg_273_1.md | 58 + ...le4.md => discoverworld_crazy_table4_1.md} | 0 .../sample_data/mineru/lincoln_letter_1.md | 1 + .../bench/sample_data/mineru/mattsnotes_1.md | 13 + ..._column_miss.md => multi_column_miss_1.md} | 0 .../bench/sample_data/mineru/olmo2-pg4_1.md | 13 + .../mineru/openstax_caculus_pg_273_1.md | 52 + .../olmocr/discoverworld_crazy_table4.md | 52 - .../olmocr/discoverworld_crazy_table4_1.md | 1 + .../olmocr/discoverworld_crazy_table4_2.md | 1 + .../olmocr/discoverworld_crazy_table4_3.md | 1 + .../olmocr/discoverworld_crazy_table4_4.md | 1 + .../olmocr/discoverworld_crazy_table4_5.md | 50 + .../sample_data/olmocr/lincoln_letter_1.md | 9 + .../sample_data/olmocr/lincoln_letter_2.md | 11 + .../sample_data/olmocr/lincoln_letter_3.md | 9 + .../sample_data/olmocr/lincoln_letter_4.md | 9 + .../sample_data/olmocr/lincoln_letter_5.md | 11 + .../bench/sample_data/olmocr/mattsnotes_1.md | 30 + .../bench/sample_data/olmocr/mattsnotes_2.md | 30 + .../bench/sample_data/olmocr/mattsnotes_3.md | 30 + .../bench/sample_data/olmocr/mattsnotes_4.md | 24 + .../bench/sample_data/olmocr/mattsnotes_5.md | 30 + .../sample_data/olmocr/multi_column_miss.md | 9 - .../sample_data/olmocr/multi_column_miss_1.md | 26 + .../sample_data/olmocr/multi_column_miss_2.md | 34 + .../sample_data/olmocr/multi_column_miss_3.md | 38 + .../sample_data/olmocr/multi_column_miss_4.md | 26 + .../sample_data/olmocr/multi_column_miss_5.md | 17 + .../bench/sample_data/olmocr/olmo2-pg4_1.md | 28 + .../bench/sample_data/olmocr/olmo2-pg4_2.md | 13 + .../bench/sample_data/olmocr/olmo2-pg4_3.md | 13 + .../bench/sample_data/olmocr/olmo2-pg4_4.md | 25 + .../bench/sample_data/olmocr/olmo2-pg4_5.md | 27 + .../olmocr/openstax_caculus_pg_273_1.md | 39 + .../olmocr/openstax_caculus_pg_273_2.md | 73 ++ .../olmocr/openstax_caculus_pg_273_3.md | 73 ++ .../olmocr/openstax_caculus_pg_273_4.md | 73 ++ .../olmocr/openstax_caculus_pg_273_5.md | 71 ++ 66 files changed, 2620 insertions(+), 61 deletions(-) create mode 100644 olmocr/bench/sample_data/chatgpt/discoverworld_crazy_table4_1.md create mode 100644 olmocr/bench/sample_data/chatgpt/lincoln_letter_1.md create mode 100644 olmocr/bench/sample_data/chatgpt/mattsnotes_1.md create mode 100644 olmocr/bench/sample_data/chatgpt/multi_column_miss_1.md create mode 100644 olmocr/bench/sample_data/chatgpt/olmo2-pg4_1.md create mode 100644 olmocr/bench/sample_data/chatgpt/openstax_caculus_pg_273_1.md create mode 100644 olmocr/bench/sample_data/chatgpt45/discoverworld_crazy_table4_1.md create mode 100644 olmocr/bench/sample_data/chatgpt45/lincoln_letter_1.md create mode 100644 olmocr/bench/sample_data/chatgpt45/mattsnotes_1.md create mode 100644 olmocr/bench/sample_data/chatgpt45/multi_column_miss_1.md create mode 100644 olmocr/bench/sample_data/chatgpt45/olmo2-pg4_1.md create mode 100644 olmocr/bench/sample_data/chatgpt45/openstax_caculus_pg_273_1.md rename olmocr/bench/sample_data/{got_ocr/discoverworld_crazy_table4.md => gotocr/discoverworld_crazy_table4_1.md} (100%) create mode 100644 olmocr/bench/sample_data/gotocr/lincoln_letter_1.md create mode 100644 olmocr/bench/sample_data/gotocr/mattsnotes_1.md rename olmocr/bench/sample_data/{got_ocr/multi_column_miss.md => gotocr/multi_column_miss_1.md} (100%) create mode 100644 olmocr/bench/sample_data/gotocr/olmo2-pg4_1.md create mode 100644 olmocr/bench/sample_data/gotocr/openstax_caculus_pg_273_1.md rename olmocr/bench/sample_data/marker/{discoverworld_crazy_table4.md => discoverworld_crazy_table4_1.md} (100%) create mode 100644 olmocr/bench/sample_data/marker/discoverworld_crazy_table4_2.md create mode 100644 olmocr/bench/sample_data/marker/discoverworld_crazy_table4_3.md create mode 100644 olmocr/bench/sample_data/marker/lincoln_letter_1.md create mode 100644 olmocr/bench/sample_data/marker/mattsnotes_1.md rename olmocr/bench/sample_data/marker/{multi_column_miss.md => multi_column_miss_1.md} (100%) create mode 100644 olmocr/bench/sample_data/marker/multi_column_miss_2.md create mode 100644 olmocr/bench/sample_data/marker/multi_column_miss_3.md create mode 100644 olmocr/bench/sample_data/marker/olmo2-pg4_1.md create mode 100644 olmocr/bench/sample_data/marker/openstax_caculus_pg_273_1.md rename olmocr/bench/sample_data/mineru/{discoverworld_crazy_table4.md => discoverworld_crazy_table4_1.md} (100%) create mode 100644 olmocr/bench/sample_data/mineru/lincoln_letter_1.md create mode 100644 olmocr/bench/sample_data/mineru/mattsnotes_1.md rename olmocr/bench/sample_data/mineru/{multi_column_miss.md => multi_column_miss_1.md} (100%) create mode 100644 olmocr/bench/sample_data/mineru/olmo2-pg4_1.md create mode 100644 olmocr/bench/sample_data/mineru/openstax_caculus_pg_273_1.md delete mode 100644 olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4.md create mode 100644 olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_1.md create mode 100644 olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_2.md create mode 100644 olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_3.md create mode 100644 olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_4.md create mode 100644 olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_5.md create mode 100644 olmocr/bench/sample_data/olmocr/lincoln_letter_1.md create mode 100644 olmocr/bench/sample_data/olmocr/lincoln_letter_2.md create mode 100644 olmocr/bench/sample_data/olmocr/lincoln_letter_3.md create mode 100644 olmocr/bench/sample_data/olmocr/lincoln_letter_4.md create mode 100644 olmocr/bench/sample_data/olmocr/lincoln_letter_5.md create mode 100644 olmocr/bench/sample_data/olmocr/mattsnotes_1.md create mode 100644 olmocr/bench/sample_data/olmocr/mattsnotes_2.md create mode 100644 olmocr/bench/sample_data/olmocr/mattsnotes_3.md create mode 100644 olmocr/bench/sample_data/olmocr/mattsnotes_4.md create mode 100644 olmocr/bench/sample_data/olmocr/mattsnotes_5.md delete mode 100644 olmocr/bench/sample_data/olmocr/multi_column_miss.md create mode 100644 olmocr/bench/sample_data/olmocr/multi_column_miss_1.md create mode 100644 olmocr/bench/sample_data/olmocr/multi_column_miss_2.md create mode 100644 olmocr/bench/sample_data/olmocr/multi_column_miss_3.md create mode 100644 olmocr/bench/sample_data/olmocr/multi_column_miss_4.md create mode 100644 olmocr/bench/sample_data/olmocr/multi_column_miss_5.md create mode 100644 olmocr/bench/sample_data/olmocr/olmo2-pg4_1.md create mode 100644 olmocr/bench/sample_data/olmocr/olmo2-pg4_2.md create mode 100644 olmocr/bench/sample_data/olmocr/olmo2-pg4_3.md create mode 100644 olmocr/bench/sample_data/olmocr/olmo2-pg4_4.md create mode 100644 olmocr/bench/sample_data/olmocr/olmo2-pg4_5.md create mode 100644 olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_1.md create mode 100644 olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_2.md create mode 100644 olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_3.md create mode 100644 olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_4.md create mode 100644 olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_5.md diff --git a/olmocr/bench/sample_data/chatgpt/discoverworld_crazy_table4_1.md b/olmocr/bench/sample_data/chatgpt/discoverworld_crazy_table4_1.md new file mode 100644 index 0000000..f408fc7 --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt/discoverworld_crazy_table4_1.md @@ -0,0 +1,50 @@ +Table 4: Baseline model performance on each of the three scoring metrics (*task completion, task process, explanatory knowledge discovery*) across all 24 DISCOVERY WORLD tasks. Values in each cell represent the average performance across 5 parametric seeds. Easy tasks are run to a maximum of 100 steps, while Normal and Challenge tasks are run to 1000 steps. + +| # | Topic | Task | ReACT | Plan+Execute | Hypothesizer | +|----|------------------------------|-----------------------------------|-------|--------------|--------------| +| 1 | Proteomics | Clustering | | | | +| 2 | Easy | Simplified Clustering | 0.87 | 0.20 | 0.08 | +| 3 | Normal | Clustering (2D) | 0.88 | 0.40 | 0.68 | +| 4 | Challenge | Clustering (3D) | 0.88 | 0.40 | 0.60 | +| 5 | Chemistry | Exploring Combinations and Hill Climbing | | | | +| 6 | Easy | Single substances | 0.87 | 1.00 | 0.70 | +| 7 | Normal | Mix of 3 substances | 0.82 | 0.00 | 0.87 | +| 8 | Challenge | Mix of 4 substances | 0.40 | 0.00 | 0.87 | +| 9 | Archaeology | Correlations | | | | +| 10 | Easy | Simple instrument | 0.87 | 0.60 | 0.33 | +| 11 | Normal | Instrument Use | 0.72 | 0.40 | 0.77 | +| 12 | Challenge | Correlation | 0.40 | 0.00 | 0.05 | +| 13 | Reactor Lab | Regression | | | | +| 14 | Easy | Linear regression | 0.42 | 0.00 | 0.10 | +| 15 | Normal | Quadratic regression | 0.43 | 0.00 | 0.00 | +| 16 | Challenge | Uncovering systems of rules | | | | +| 17 | Easy | Simplified rules | 0.91 | 0.60 | 0.78 | +| 18 | Normal | Presence rules | 0.87 | 0.00 | 0.40 | +| 19 | Challenge | Legal Rules | 0.00 | 0.00 | 0.00 | +| 20 | Translation | Rosetta-stone style linguistic discovery of alien language | | | | +| 21 | Easy | Noun and verb | 0.57 | 0.00 | 0.00 | +| 22 | Normal | Noun, adj., and verb | 0.49 | 0.00 | 0.55 | +| 23 | Challenge | | | | | +| 24 | Average (Easy) | | 0.59 | 0.25 | 0.56 | +| 25 | Average (Normal) | | 0.05 | 0.14 | 0.18 | +| 26 | Average (Challenge) | | 0.63 | 0.10 | 0.15 | + +Table 5: Baseline model performance on each of the three scoring metrics (*task completion, task process, explanatory knowledge discovery*) across all 10 unit test tasks. Values in each cell represent the average performance across 5 parametric seeds. Unit tests tasks are run to a maximum of 100 steps. + +| # | Unit Test Topic | ReACT | Plan+Execute | Hypothesizer | +|----|------------------------------|-------|--------------|--------------| +| 25 | Multi-turn dialog with an agent | 1.00 | 1.00 | 1.00 | +| 26 | Measure an object with an instrument | 0.87 | 0.60 | 0.73 | +| 27 | Pick-and-place object | 0.90 | 0.80 | 0.80 | +| 28 | Pick-and-place object | 1.00 | 1.00 | 1.00 | +| 29 | Read DiscoveryFeed posts | 1.00 | 1.00 | 1.00 | +| 30 | Move through doors | 0.55 | 0.20 | 0.25 | +| 31 | Using keys with doors | 0.60 | 0.20 | 0.00 | +| 32 | Navigate to a specific room in a house | 0.20 | 0.00 | 0.00 | +| 33 | Search an environment for an object | 0.80 | 0.00 | 0.00 | +| 34 | Interact with a moving agent | 0.80 | 0.20 | 0.53 | +| 35 | Average (Unit Tests) | 0.76 | 0.60 | 0.66 | + +4.2 Baseline Agent Models + +The baseline agents are described below, with model performance on Discovery tasks shown in Table 4, and performance on Unit Tests shown in Table 5. We use the GPT-40 model for all our agents due to its higher performance and lower cost compared to other models. For space we provide... \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt/lincoln_letter_1.md b/olmocr/bench/sample_data/chatgpt/lincoln_letter_1.md new file mode 100644 index 0000000..c5a87ce --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt/lincoln_letter_1.md @@ -0,0 +1,15 @@ +Executive Mansion, + +Washington City, + +January 10th, 1864. + +Major General Hitchcock, Commissioner for Exchanges, +is authorized and directed to offer Brigadier General Trimble, +now a prisoner of war in Fort McHenry, in exchange for +Major White, who is held as a prisoner at Richmond. +He is also directed to send forward the offer of exchange +by Henry M. Warfield, Esq. of Baltimore, under a flag +of truce, and give him a pass to City Point. + +Abraham Lincoln. \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt/mattsnotes_1.md b/olmocr/bench/sample_data/chatgpt/mattsnotes_1.md new file mode 100644 index 0000000..f3b8d8b --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt/mattsnotes_1.md @@ -0,0 +1,24 @@ +V-February Flow + +Data Components: + +Code: +The-Stack-V2 + +CodeText: +SE, whatever we've scraped + +WebText: +HQDCLM + +DATA MIXES + +~85% Source Code +~10% CodeText +~ 5% Webtext + +~ 85% The-stack-V2 +~ 15% CodeText +~ 0% Webtext + +~100% Source Code \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt/multi_column_miss_1.md b/olmocr/bench/sample_data/chatgpt/multi_column_miss_1.md new file mode 100644 index 0000000..798644c --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt/multi_column_miss_1.md @@ -0,0 +1,28 @@ +stakeholders has occurred in other nations, with groups and individuals refusing to risk being appropriated into the industry's public relations ambitions. It now looks like that with vigilance, tobacco control advocates can easily foment similar distaste in many areas of the business community. Our actions sought to denormalise the tobacco industry by disrupting its efforts to take its place alongside other industries—often with considerable social credit—in the hope that it might gain by association. + +Tobacco industry posturing about its corporate responsibility can never hide the ugly consequences of its ongoing efforts to "work with all relevant stakeholders for the preservation of opportunities for informed adults to consume tobacco products" (translation: "we will build alliances with others who want to profit from tobacco use, to do all we can to counteract effective tobacco control"). BAT has 15.4% and Philip Morris 16.4% of the global cigarette market.6 With 4.9 million smokers currently dying from tobacco use each year, and the industry unblinkingly concurring that its products are addictive, this leaves BAT to argue why it should not be held to be largely accountable for the annual deaths of some 754 600 smokers, and Philip Morris some 803 600 smokers. + +REFERENCES +1 British American Tobacco. Social Report. http://www.bat.com/204pp. +2 Wroe D. Tobacco ad campaign angers MPs. The Age (Melbourne) 2004; May 17 http://www.theage.com.au/articles/2004/05/16/1084646069771.html?oneclick=true. +3 Hirschhorn N. Corporate social responsibility and the tobacco industry: hope or hype? Tobacco Control 2004;13:447–453. +4 Ethical Corporation Asia 2004. Conference website. http://www.ethicalcorp.com/asia2004/. +5 Chapman S, Shatenstein S. Extreme corporate makeover: tobacco companies, corporate responsibility and the corruption of “ethics”. Globalink petition. http://petition.globalink.org/view.php?code= enema. +6 Mackay J, Eriksen M. The tobacco atlas. Geneva: World Health Organization, 2002. + +INDUSTRY WATCH +Corporate social responsibility and the tobacco industry: hope or hype? +N Hirschhorn + +Tobacco Control 2004;13:447–453. doi: 10.1136/tc.2003.006676 + +Corporate social responsibility (CSR) emerged from a realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company’s deliberations on the matter, and the company’s perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +Over the past three decades increasing pressure from non-governmental organisations (NGOs), governments and the United Nations, has required transnational corporations (TNCs) to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as “corporate social responsibility” (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to a version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity along standards of business ethics or as an irretrievably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +CORPORATE SOCIAL RESPONSIBILITY: THE CONTEXT +The term “corporate social responsibility” is in vogue at the moment but as a concept it is vague and means different things to different people.1 + +Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of “noblesse oblige”. But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century.2 The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of... + +Abbreviations: ASH, Action on Smoking and Health; BAT, British American Tobacco; CERES, Coalition for Environmentally Responsible Economies; CSR, corporate social responsibility; DJSI, Dow Jones Sustainability Index; GCAC, Global Corporate Affairs Council; GRI, Global Reporting Initiative; MSA, Master Settlement Agreement; NGOs, non-governmental organisations; PM, Philip Morris; TNCs, transnational corporations; UNEP, United Nations Environment Program \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt/olmo2-pg4_1.md b/olmocr/bench/sample_data/chatgpt/olmo2-pg4_1.md new file mode 100644 index 0000000..476ebc3 --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt/olmo2-pg4_1.md @@ -0,0 +1,24 @@ +| Source | Type | Tokens | Words | Bytes | Docs | +|------------------------|------------------|--------|-------|--------|-------| +| DCLM-Baseline | Web pages | 3.71T | 3.32T | 21.32T | 2.95B | +| StarCoder | Code | 83.0B | 70.0B | 459B | 78.7M | +| peS2o | Academic papers | 58.6B | 51.1B | 413B | 38.8M | +| arXiv | STEM papers | 20.8B | 19.3B | 77.2B | 3.95M | +| OpenWebMath | Math web pages | 12.2B | 11.1B | 47.2B | 2.89M | +| Algebraic Stack | Math proofs code | 11.8B | 10.8B | 44.0B | 2.83M | +| Wikipedia & Wikibooks | Encyclopedic | 3.7B | 3.16B | 16.2B | 6.17M | +| **Total** | | **3.90T** | **3.48T** | **22.38T** | **3.08B** | + +Table 1: Composition of the pretraining data for OLMo 2. The OLMo 2 1124 Mix is composed of StarCoder (Li et al., 2023b; Kocetkov et al., 2022), peS2o (Soldaini and Lo, 2023), web text from DCLM (Li et al., 2024) and Wiki come from Dolma 1.7 (Soldaini et al., 2024). arXiv comes from Red-Pajama (Together AI, 2023), while OpenWebMath (Paster et al., 2023) and Algebraic Stack come from ProofPile II (Azerbayev et al., 2023). + +2.1.1 Pretraining data: OLMo 2 Mix 1124 + +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over 95% derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data used in OLMoE (Muennighoff et al., 2024). + +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use the "baseline 1.0" mix. From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., 2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). + +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection of this source, we found it to contain documents encoded in binary format or containing mostly numerical content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the document, or whose top-2 most frequent words constitute over 50% of the document. To mitigate possible training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details and show effectiveness of this intervention in Section §3.1. + +2.1.2 Mid-training data: Dolmino Mix 1124 + +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide focused exposure to STEM references and high quality text. We generate several variants of this mixture, with varying sizes, but generally refer to this mixture as Dolmino Mix 1124. The base sources from which Dolmino Mix 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep dive detailing our processes for experimenting and curating data for this mix. \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt/openstax_caculus_pg_273_1.md b/olmocr/bench/sample_data/chatgpt/openstax_caculus_pg_273_1.md new file mode 100644 index 0000000..278460f --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt/openstax_caculus_pg_273_1.md @@ -0,0 +1,57 @@ +3.4 EXERCISES + +For the following exercises, the given functions represent the position of a particle traveling along a horizontal line. + +a. Find the velocity and acceleration functions. +b. Determine the time intervals when the object is slowing down or speeding up. + +150. \( s(t) = 2t^3 - 3t^2 - 12t + 8 \) + +151. \( s(t) = 2t^3 - 15t^2 + 36t - 10 \) + +152. \( s(t) = \frac{t}{1 + t^2} \) + +153. A rocket is fired vertically upward from the ground. The distance \( s \) in feet that the rocket travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 560t \). + +a. Find the velocity of the rocket 3 seconds after being fired. +b. Find the acceleration of the rocket 3 seconds after being fired. + +154. A ball is thrown downward with a speed of 8 ft/s from the top of a 64-foot-tall building. After \( t \) seconds, its height above the ground is given by \( s(t) = -16t^2 - 8t + 64 \). + +a. Determine how long it takes for the ball to hit the ground. +b. Determine the velocity of the ball when it hits the ground. + +155. The position function \( s(t) = t^2 - 3t - 4 \) represents the position of the back of a car backing out of a driveway and then driving in a straight line, where \( s \) is in feet and \( t \) is in seconds. In this case, \( s(t) = 0 \) represents the time at which the back of the car is at the garage door, so \( s(0) = -4 \) is the starting position of the car, 4 feet inside the garage. + +a. Determine the velocity of the car when \( s(t) = 0 \). +b. Determine the velocity of the car when \( s(t) = 14 \). + +156. The position of a hummingbird flying along a straight line in \( t \) seconds is given by \( s(t) = 3t^3 - 7t \) meters. + +a. Determine the velocity of the bird at \( t = 1 \) sec. +b. Determine the acceleration of the bird at \( t = 1 \) sec. +c. Determine the acceleration of the bird when the velocity equals 0. + +157. A potato is launched vertically upward with an initial velocity of 100 ft/s from a potato gun at the top of an 85-foot-tall building. The distance in feet that the potato travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 100t + 85 \). + +a. Find the velocity of the potato after 0.5 s and 5.75 s. +b. Find the speed of the potato at 0.5 s and 5.75 s. +c. Determine when the potato reaches its maximum height. +d. Find the acceleration of the potato at 0.5 s and 1.5 s. +e. Determine how long the potato is in the air. +f. Determine the velocity of the potato upon hitting the ground. + +158. The position function \( s(t) = t^3 - 8t \) gives the position in miles of a freight train where east is the positive direction and \( t \) is measured in hours. + +a. Determine the direction the train is traveling when \( s(t) = 0 \). +b. Determine the direction the train is traveling when \( a(t) = 0 \). +c. Determine the time intervals when the train is slowing down or speeding up. + +159. The following graph shows the position \( y = s(t) \) of an object moving along a straight line. + +![Graph of position function](image) + +a. Use the graph of the position function to determine the time intervals when the velocity is positive, negative, or zero. +b. Sketch the graph of the velocity function. +c. Use the graph of the velocity function to determine the time intervals when the acceleration is positive, negative, or zero. +d. Determine the time intervals when the object is speeding up or slowing down. \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt45/discoverworld_crazy_table4_1.md b/olmocr/bench/sample_data/chatgpt45/discoverworld_crazy_table4_1.md new file mode 100644 index 0000000..1edc89d --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt45/discoverworld_crazy_table4_1.md @@ -0,0 +1,3 @@ +4.2 Baseline Agent Models + +The baseline agents are described below, with model performance on Discovery tasks shown in Table 4, and performance on Unit Tests shown in Table 5. We use the GPT-4o model for all our agents due to its higher performance and lower cost compared to other models. \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt45/lincoln_letter_1.md b/olmocr/bench/sample_data/chatgpt45/lincoln_letter_1.md new file mode 100644 index 0000000..f49acc3 --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt45/lincoln_letter_1.md @@ -0,0 +1,11 @@ +Executive Mansion, + +Washington City, + +January 10th, 1864 + +Major General Hitchcock, Commissioner of Exchanges, is authorized and directed to offer Brigadier General Trimble, now a prisoner of war in Fort McHenry, in exchange for Major White, who is held as a prisoner at Richmond. + +He is also directed to send forward the offer of exchange by Henry M. Warfield, Esq. of Baltimore, under a flag of truce, and give him a pass to City Point. + +Abraham Lincoln \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt45/mattsnotes_1.md b/olmocr/bench/sample_data/chatgpt45/mattsnotes_1.md new file mode 100644 index 0000000..7f62fd1 --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt45/mattsnotes_1.md @@ -0,0 +1,23 @@ +V-February Flow + +Data Components: +Code: +The-stack-V2 +CodeText: +SE, whatever we've scraped +WebText: +HQOCLM + +DATA MIXES +~85% Source Code +~10% CodeText +~5% Webtext +Deepseek Coder + +~85% The-stack-V2 +~15% CodeText +~0% webtext +Starcoder 2 + +~100% Source Code +Arctic \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt45/multi_column_miss_1.md b/olmocr/bench/sample_data/chatgpt45/multi_column_miss_1.md new file mode 100644 index 0000000..f6b4eae --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt45/multi_column_miss_1.md @@ -0,0 +1,12 @@ +Corporate social responsibility and the tobacco industry: hope or hype? + +N Hirschhorn + +Corporate social responsibility (CSR) emerged from a realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company's deliberations on the matter, and the company's perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +Over the past three decades increasing pressure from non-governmental organisations (NGOs), governments and the United Nations, has required transnational corporations (TNCs) to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as "corporate social responsibility" (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to its own version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity along standards of business ethics, or as an irretrievably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +CORPORATE SOCIAL RESPONSIBILITY: THE CONTEXT +The term "corporate social responsibility" is in vogue at the moment but as a concept it is vague and means different things to different people.1 + +Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of "noblesse oblige". But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century.2 3 The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt45/olmo2-pg4_1.md b/olmocr/bench/sample_data/chatgpt45/olmo2-pg4_1.md new file mode 100644 index 0000000..3444cce --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt45/olmo2-pg4_1.md @@ -0,0 +1,13 @@ +Table 1 Composition of the pretraining data for OLMo 2. The OLMo 2 1124 Mix is composed of StarCoder (Li et al., 2023b; Kocetkov et al., 2022), peS2o (Soldaini and Lo, 2023), web text from DCLM (Li et al., 2024) and Wiki come from Dolma 1.7 (Soldaini et al., 2024). arXiv comes from Red-Pajama (Together AI, 2023), while OpenWebMath (Paster et al., 2023) and Algebraic Stack come from ProofPile II (Azerbayev et al., 2023). + +2.1.1 Pretraining data: OLMo 2 Mix 1124 + +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over 95% derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data used in OLMoE (Muennighoff et al., 2024). + +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use the "baseline 1.0" mix. From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., 2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). + +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection of this source, we found it to contain documents encoded in binary format or containing mostly numerical content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the document, or whose top-2 most frequent words constitute over 50% of the document. To mitigate possible training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details and show effectiveness of this intervention in Section §3.1. + +2.1.2 Mid-training data: Dolmino Mix 1124 + +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide focused exposure to STEM references and high quality text. We generate several variants of this mixture, with varying sizes, but generally refer to this mixture as Dolmino Mix 1124. The base sources from which Dolmino Mix 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep dive detailing our processes for experimenting and curating data for this mix. \ No newline at end of file diff --git a/olmocr/bench/sample_data/chatgpt45/openstax_caculus_pg_273_1.md b/olmocr/bench/sample_data/chatgpt45/openstax_caculus_pg_273_1.md new file mode 100644 index 0000000..676d2ba --- /dev/null +++ b/olmocr/bench/sample_data/chatgpt45/openstax_caculus_pg_273_1.md @@ -0,0 +1,55 @@ +3.4 EXERCISES + +For the following exercises, the given functions represent the position of a particle traveling along a horizontal line. + +a. Find the velocity and acceleration functions. +b. Determine the time intervals when the object is slowing down or speeding up. + +150. \( s(t) = 2t^3 - 3t^2 - 12t + 8 \) + +151. \( s(t) = 2t^3 - 15t^2 + 36t - 10 \) + +152. \( s(t) = \frac{t}{1 + t^2} \) + +153. A rocket is fired vertically upward from the ground. The distance \( s \) in feet that the rocket travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 560t \). + +a. Find the velocity of the rocket 3 seconds after being fired. +b. Find the acceleration of the rocket 3 seconds after being fired. + +154. A ball is thrown downward with a speed of 8 ft/s from the top of a 64-foot-tall building. After \( t \) seconds, its height above the ground is given by \( s(t) = -16t^2 - 8t + 64 \). + +a. Determine how long it takes for the ball to hit the ground. +b. Determine the velocity of the ball when it hits the ground. + +155. The position function \( s(t) = t^2 - 3t - 4 \) represents the position of the back of a car backing out of a driveway and then driving in a straight line, where \( s \) is in feet and \( t \) is in seconds. In this case, \( s(t) = 0 \) represents the time at which the back of the car is at the garage door, so \( s(0) = -4 \) is the starting position of the car, 4 feet inside the garage. + +a. Determine the velocity of the car when \( s(t) = 0 \). +b. Determine the velocity of the car when \( s(t) = 14 \). + +156. The position of a hummingbird flying along a straight line in \( t \) seconds is given by \( s(t) = 3t^3 - 7t \) meters. + +a. Determine the velocity of the bird at \( t = 1 \) sec. +b. Determine the acceleration of the bird at \( t = 1 \) sec. +c. Determine the acceleration of the bird when the velocity equals 0. + +157. A potato is launched vertically upward with an initial velocity of 100 ft/s from a potato gun at the top of an 85-foot-tall building. The distance in feet that the potato travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 100t + 85 \). + +a. Find the velocity of the potato after 0.5 s and 5.75 s. +b. Find the speed of the potato at 0.5 s and 5.75 s. +c. Determine when the potato reaches its maximum height. +d. Find the acceleration of the potato at 0.5 s and 1.5 s. +e. Determine how long the potato is in the air. +f. Determine the velocity of the potato upon hitting the ground. + +158. The position function \( s(t) = t^3 - 8t \) gives the position in miles of a freight train where east is the positive direction and \( t \) is measured in hours. + +a. Determine the direction the train is traveling when \( s(t) = 0 \). +b. Determine the direction the train is traveling when \( a(t) = 0 \). +c. Determine the time intervals when the train is slowing down or speeding up. + +159. The following graph shows the position \( y = s(t) \) of an object moving along a straight line. + +a. Use the graph of the position function to determine the time intervals when the velocity is positive, negative, or zero. +b. Sketch the graph of the velocity function. +c. Use the graph of the velocity function to determine the time intervals when the acceleration is positive, negative, or zero. +d. Determine the time intervals when the object is speeding up or slowing down. \ No newline at end of file diff --git a/olmocr/bench/sample_data/got_ocr/discoverworld_crazy_table4.md b/olmocr/bench/sample_data/gotocr/discoverworld_crazy_table4_1.md similarity index 100% rename from olmocr/bench/sample_data/got_ocr/discoverworld_crazy_table4.md rename to olmocr/bench/sample_data/gotocr/discoverworld_crazy_table4_1.md diff --git a/olmocr/bench/sample_data/gotocr/lincoln_letter_1.md b/olmocr/bench/sample_data/gotocr/lincoln_letter_1.md new file mode 100644 index 0000000..2bbf1bd --- /dev/null +++ b/olmocr/bench/sample_data/gotocr/lincoln_letter_1.md @@ -0,0 +1,11 @@ +43571 +Bachington City +January 10th 1864. +Major General Architect, Commissioner of aivachangera +is authorized and directed by ffeed Bngader General Trelmble, +new a firemen of war in Fert nchery in exchange for +Mayor White, who held a a firemen at Hillmannd. +He is aker conducted by end forward the offer of exchange +by Henry in. Warfield, Lag. of Balthmore, under a flag +of three, and five him afaies to City Bink. +Abraham Lincoln \ No newline at end of file diff --git a/olmocr/bench/sample_data/gotocr/mattsnotes_1.md b/olmocr/bench/sample_data/gotocr/mattsnotes_1.md new file mode 100644 index 0000000..a9f975d --- /dev/null +++ b/olmocr/bench/sample_data/gotocr/mattsnotes_1.md @@ -0,0 +1 @@ +V- February F lew Data Components: Code: The- stack- V 2 Code Text: SE, whatever we' ve Scraped web Test: H& D CL M DATA MEXES ~ 85% So v rie Code De pe scek ~ 5% web text ~ 85% The- s back- V 2 St eur der ~ 15% Code Text 2 ~ 0% web text ~ 10% Source Code \ No newline at end of file diff --git a/olmocr/bench/sample_data/got_ocr/multi_column_miss.md b/olmocr/bench/sample_data/gotocr/multi_column_miss_1.md similarity index 100% rename from olmocr/bench/sample_data/got_ocr/multi_column_miss.md rename to olmocr/bench/sample_data/gotocr/multi_column_miss_1.md diff --git a/olmocr/bench/sample_data/gotocr/olmo2-pg4_1.md b/olmocr/bench/sample_data/gotocr/olmo2-pg4_1.md new file mode 100644 index 0000000..cc336c6 --- /dev/null +++ b/olmocr/bench/sample_data/gotocr/olmo2-pg4_1.md @@ -0,0 +1,89 @@ +Source +Type +Tokens +Words +Bytes +Docs +Pretraining + OLMo 2 1124 Mix +DCLM-Baseline +Web pages +3.71T +3.32T +21.32T +2.95B +StarCoder +f11ered version +from OLMoE Mix +Code +83.0B +70.0B +459B +78.7M +peS2o +from Dolma 1.7 +Academic papers +58.6B +51.1B +413B +38.8M +arXiv +STEM papers +20.8B +19.3B +77.2B +3.95M +OpenWebMath +Math web pages +12.2B +11.1B +47.2B +2.89M +Algebraic Stack +Math proofs code +11.8B +10.8B +44.0B +2.83M +Wikipedia & Wikibooks +from Dolma 1.7 +Encyclopedia +3.7B +3.16B +16.2B +6.17M +Total +3.90T +3.48T +22.38T +3.08B +Table1 CompositionofthepretrainingdataforOLMo2. The OLMo 2 1124 Mix is composed of StarCoder (Li et al., +2023b; Kocetkov et al., 2022), peS2o (Soldaini and Lo, 2023), web text from DCLM (Li et al., 2024) and Wiki come from +Dolma 1.7 (Soldaini et al., 2024). arXiv comes from Red-Pajana (Together AI, 2023), while OpenWebMath (Paster +et al., 2023) and Algebraic Stack come from ProofPile II (Azerbayev et al., 2023). +2.1.1 +Pretraining data: OLMo 2 Mix 1124 +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over +95% derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data +used in OLMoE (Muennighoffet al., 2024). +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use +the “baseline 1.0” mix.4 From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., +2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and +Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed +repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove +any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection +of this source, we found it to contain documents encoded in binary format or containing mostly numerical +content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the +document, or whose top-2 most frequent words constitute over 50% of the document. To mitigate possible +training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details +and show effectiveness of this intervention in Section §3.1. +2.1.2 +Mid-training data: Dolmino Mix 1124 +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that +has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of +which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide +focused exposure to STEM references and high quality text. We generate several variants of this mixture, +with varying sizes, but generally refer to this mixture as Dolmino Mix 1124. The base sources from which +DOLmino Mix 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep +dive detailing our processes for experimenting and curating data for this mix. +4 \ No newline at end of file diff --git a/olmocr/bench/sample_data/gotocr/openstax_caculus_pg_273_1.md b/olmocr/bench/sample_data/gotocr/openstax_caculus_pg_273_1.md new file mode 100644 index 0000000..ab888a8 --- /dev/null +++ b/olmocr/bench/sample_data/gotocr/openstax_caculus_pg_273_1.md @@ -0,0 +1,1045 @@ +Chapter 3 | Derivatives +273 +3.4 EXERCISES +For the following exercises, the given functions represent +the position of a particle traveling along a horizontal line. +a. +Find the velocity and acceleration functions. +b. +Determine the time intervals when the object is +slowing down or speeding up. +150. +s(t) = 2t3 −3t2 −12t + 8 +151. +s(t) = 2t3 −15t2 + 36t −10 +152. +s(t) = +t +1 + t2 +153. +A rocket is fired vertically upward from the ground. +The distance +s +in +feet +that +the +rocket +travels +from +the +ground after +t seconds is given by +s(t) = −16t2 + 560t. +a. +Find the velocity of the rocket 3 seconds after being +fired. +b. +Find the acceleration of the rocket 3 seconds after +being fired. +154. +A ball is thrown downward with a speed of 8 ft/ +s from the top of a 64-foot-tall building. After t seconds, +its +height +above +the +ground +is +given +by +s(t) = −16t2 −8t + 64. +a. +Determine how long it takes for the ball to hit the +ground. +b. +Determine the velocity of the ball when it hits the +ground. +155. +The position function +s(t) = t2 −3t −4 represents +the position of the back of a car backing out of a driveway +and then driving in a straight line, where +s +is in feet and +t is in seconds. In this case, s(t) = 0 represents the time +at which the back of the car is at the garage door, so +s(0) = −4 is the starting position of the car, 4 feet inside +the garage. +a. +Determine the velocity of the car when +s(t) = 0. +b. +Determine the velocity of the car when +s(t) = 14. +156. +The position of a hummingbird flying along a straight +line in +t seconds is given by +s(t) = 3t3 −7t +2 +2 +2 +2 +2 +2 +2 +2 +2 +2 +3 +3 +3 +3 +3 +3 +3 +3 +3 +3 +4 +4 +4 +4 +4 +4 +4 +4 +4 +4 +5 +5 +5 +5 +5 +5 +5 +5 +5 +5 +4 +4 +4 +4 +4 +4 +4 +4 +4 +3 +3 +3 +3 +3 +3 +3 +3 +3 +1 +1 +1 +1 +1 +1 +1 +1 +1 +1 +3 +3 +3 +3 +3 +3 +3 +3 +3 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +1 +1 +1 +1 +1 +1 +1 +1 +1 +2 +2 +2 +2 +2 +2 +2 +2 +2 +1 +1 +1 +1 +1 +1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +3 +3 +3 +3 +3 +3 +3 +3 +3 +2 +2 +2 +2 +2 +2 +2 +2 +2 +4 +4 +4 +4 +4 +4 +4 +4 +4 +2 +2 +2 +2 +2 +2 +2 +2 +2 +0 +1 +1 +1 +1 +1 +1 +1 +1 +3 +4 +4 +4 +4 +4 +4 +4 +4 +3 +4 +4 +4 +4 +4 +4 +4 +4 +2 +3 +3 +3 +3 +3 +3 +3 +3 +0 +1 +1 +1 +1 +1 +1 +1 +1 +0 +1 +1 +1 +1 +1 +1 +1 +1 +2 +1 +1 +1 +1 +1 +1 +1 +1 +0 +2 +2 +2 +2 +2 +2 +2 +2 +2 +5 +5 +5 +5 +5 +5 +5 +5 +5 +1 +1 +1 +1 +1 +1 +1 +1 +1 +5 +5 +5 +5 +5 +5 +5 +5 +5 +0 +0 +0 +0 +0 +0 +0 +0 +0 +5 +5 +5 +5 +5 +5 +5 +5 +5 +3 +3 +3 +3 +3 +3 +3 +3 +3 +5 +5 +5 +5 +5 +5 +5 +5 +5 +2 +2 +2 +2 +2 +2 +2 +2 +2 +a. +Use the graph of the position function to determine +the time intervals when the velocity is positive, +negative, or zero. +b. +Sketch the graph of the velocity function. +c. +Use the graph of the velocity function to determine +the time intervals when the acceleration is positive, +negative, or zero. +d. +Determine the time intervals when the object is +speeding up or slowing down. +157. +A potato is launched vertically upward with an initial +velocity of 100 ft/s from a potato gun at the top of an +85-foot-tall building. The distance in feet that the potato +travels from the ground after +t seconds is given by +s(t) = −16t2 + 100t + 85. +a. +Find the velocity of the potato after 0.5 s and +5.75 s. +b. +Find the speed of the potato at 0.5 s and 5.75 s. +c. +Determine when the potato reaches its maximum +height. +d. +Find the acceleration of the potato at 0.5 s and 1.5 +s. +e. +Determine how long the potato is in the air. +f. +Determine the velocity of the potato upon hitting +the ground. +158. +The position function +s(t) = t3 −8t gives the +position in miles of a freight train where east is the positive +direction and +t is measured in hours. +a. +Determine the direction the train is traveling when +s(t) = 0. +b. +Determine the direction the train is traveling when +a(t) = 0. +c. +Determine the time intervals when the train is +slowing down or speeding up. +159. +The following graph shows the position +y = s(t) of +an object moving along a straight line. +155. +The position of a hummingbird flying along a straight +line in +t +seconds is given by +s(t) = 3t3 −7t +2 +2 3 +3 +3 +3 +3 +3 +3 +3 +3 +3 3 +3 +3 +3 +3 +3 +3 +3 +3 +0.5 +1 +1.5 +2 +2.5 +3 +3.5 +4 +4.5 +5 +5.5 +6 +6.5 +7 +7.5 +8 +8.5 +9 +9.5 +10 +10.5 +11 +11.5 +12 +12.5 +13 +13.5 +14 +14.5 +15 +15.5 +16 +16.5 +17 +17.5 +18 +18.5 +19 +19.5 +20 +20.5 +21 +21.5 +22 +22.5 +23 +23.5 +24 +24.5 +25 +25.5 +26 +26.5 +27 +27.5 +28 +28.5 +29 +29.5 +30 +30.5 +31 +31.5 +32 +32.5 +33 +33.5 +34 +34.5 +35 +35.5 +36 +36.5 +37 +37.5 +38 +38.5 +39 +39.5 +40 +40.5 +41 +41.5 +42 +42.5 +43 +43.5 +44 +44.5 +45 +45.5 +46 +46.5 +47 +47.5 +48 +48.5 +49 +49.5 +50 +50.5 +51 +51.5 +52 +52.5 +53 +53.5 +54 +54.5 +55 +55.5 +56 +56.5 +57 +57.5 +58 +58.5 +59 +59.5 +60 +60.5 +61 +61.5 +62 +62.5 +63 +63.5 +64 +64.5 +65 +65.5 +66 +66.5 +67 +67.5 +68 +68.5 +69 +69.5 +70 +70.5 +71 +71.5 +72 +72.5 +73 +73.5 +74 +74.5 +75 +75.5 +76 +76.5 +77 +77.5 +78 +78.5 +79 +79.5 +80 +80.5 +81 +81.5 +82 +82.5 +83 +83.5 +84 +84.5 +85 +85.5 +86 +86.5 +87 +87.5 +88 +88.5 +89 +89.5 +90 +90.5 +91 +91.5 +92 +92.5 +93 +93.5 +94 +94.5 +95 +95.5 +96 +96.5 +97 +97.5 +98 +98.5 +99 +99.5 +10 +10.5 +11 +11.5 12 +12 +12.5 +13 +13.5 +14 14.5 +15 +15.5 +16 +16.0 +17 +17.5 +18 +18.5 +19 19.5 +20 +20.5 +21 +21.0 +21.5 +22 +22.5 +23 +23 +23.5 +24 +24.5 +25 25.5 +26 +26.5 +27 +27.0 +27.5 +28 +28.5 +29 +29 +29.5 +30 +30.5 +31 31.5 +32 +32.5 +33 +33.0 +33.5 +34 +34.5 +35 +35 +35.5 +36 +36.5 +38 +38.5 +39 +39.5 +39.5 +40 +40.5 +41 +41 +41.5 +42 +42.5 +43 43.5 +44 +44.5 +45 +45.0 +46 +46.5 +47 +47.5 +48 48.5 +49 +49.5 +50 +50.0 +51 +51.5 +52 +52.5 +53 53.5 +54 +54.5 +55 +55.0 +56 +56.5 +57 +57.5 +58 58.5 +59 +59.5 +60 +60.0 +61 +61.5 +62 +62.5 +63 63.5 +64 +64.5 +65 +65.0 +66 +66.5 +67 +67.5 +68 68.5 +69 +69.5 +70 +70.0 +71 +71.5 +72 +72.5 +73 73.5 +74 +74.5 +75 +75.0 +76 +76.5 +77 +77.5 +78 78.5 +79 +79.5 +80 +80.0 +81 +81.5 +82 +82.5 +83 83.5 +84 +84.5 +85 +85.0 +86 +86.5 +87 +87.5 +88 88.5 +89 +89.5 +90 +90.0 +91 +91.5 +92 +92.5 +93 93.5 +94 +94.5 +95 +95.0 +96 +96.5 +97 +97.5 +98 98.5 +99 +99.5 +10 +10.0 +10.5 +11 +11.0 +11.5 +12 +12.5 +13 +13 +13.5 +14 +14.5 +15 15.5 +16 +16.5 +17 +17.0 +18 +18.5 +19 +19.5 +20 20.5 +21 +21.5 +22 +22.0 +23 +23.5 +24 +24.5 +25.5 +26 +26.5 +27 +28 +28.5 +29 +29.5 +30 30.5 +31 +31.5 +32 +32.0 +33 +33.5 +34 +34.5 +35 35.5 +36 +36.5 +37 +37.0 +38 +38.5 +39 +39.5 +40 40.5 +41 +41.5 +42 +42.0 +43 +43.5 +44 +44.5 +45 45.5 +46 +46.5 +47 +47.0 +48 +48.5 +49 +49.5 +50 50.0 +51 +51.5 +52 +52.0 +53 +53.5 +54 +54.5 +55 55.5 +56 +56.5 +57 +57.0 +58 +58.5 +59 +59.5 +60 60.0 +61 +61.5 +62 +62.0 +63 +63.5 +64 +64.5 +65 65.5 +66 +66.5 +67 +67.0 +68 +68.5 +69 +69.5 +70 70.5 +71 +71.5 +72 +72.0 +73 +73.5 +74 +74.5 +75 75.5 +76 +76.5 +77 +77.0 +78 +78.5 +79 +79.5 +80 80.0 +81 +81.5 +82 +82.0 +83 +83.5 +84 +84.5 +85 85.5 +86 +86.5 +87 +87.0 +88 +88.5 +89 +89.5 +90 90.0 +91 +91.5 +92 +92.0 +93 +93.5 +94 +94.5 +95 95.0 +96 +96.5 +97 +97.0 +98 +98.5 +99 +99.5 +100 +100.5 +110.0 +110.5 +110.5 +120 +120.5 +121 +121.5 +122 +122.5 +123 +123.5 +124 +124.5 +125 +125.5 +126 +126.5 +127 +127.5 +128 +128.5 +129 +129.5 +130 +130.5 +131 +131.5 +132 +132.5 +133 +133.5 +134 +134.5 +135 +135.5 +136 +136.5 +137 +137.5 +138 +138.5 +139 +139.5 +140 +140.5 +141 \ No newline at end of file diff --git a/olmocr/bench/sample_data/marker/discoverworld_crazy_table4.md b/olmocr/bench/sample_data/marker/discoverworld_crazy_table4_1.md similarity index 100% rename from olmocr/bench/sample_data/marker/discoverworld_crazy_table4.md rename to olmocr/bench/sample_data/marker/discoverworld_crazy_table4_1.md diff --git a/olmocr/bench/sample_data/marker/discoverworld_crazy_table4_2.md b/olmocr/bench/sample_data/marker/discoverworld_crazy_table4_2.md new file mode 100644 index 0000000..07356a2 --- /dev/null +++ b/olmocr/bench/sample_data/marker/discoverworld_crazy_table4_2.md @@ -0,0 +1,63 @@ +Table 4: Baseline model performance on each of the three scoring metrics *(task completion, task process, explanatory knowledge discovery)* across all 24 DISCOVERYWORLD tasks. Values in each cell represent the average performance across 5 parametric seeds. *Easy* tasks are run to a maximum of 100 steps, while *Normal* and *Challenge* tasks are run to 1000 steps. + +| | | | ReACT | | | | Plan+Execute | | | Hypothesizer | | | | +|---------------------------------------------------------------------------|-----------------|-----------------------------------------------|-----------------------------|------|-----------|-------------------------|--------------|-------------------------|------|--------------|-----------|--|--| +| | | | Completion
Procedure | | | Completion
Procedure | | Completion
Procedure | | | | | | +| # | Topic | Task | | | Knowledge | | | Knowledge | | | Knowledge | | | +| | Proteomics | Clustering | | | | | | | | | | | | +| 1 | Easy | Simplified Clustering | 0.87 | 0.20 | 0.20 | 0.80 | 0.00 | 0.00 | 0.90 | 0.40 | 1.00 | | | +| 2 | Normal | Clustering (2D) | 0.88 | 0.40 | 0.40 | 0.68 | 0.20 | 0.00 | 0.93 | 0.40 | 0.40 | | | +| 3 | Challenge | Clustering (3D) | 0.88 | 0.40 | 0.60 | 0.58 | 0.20 | 0.00 | 0.93 | 0.40 | 0.60 | | | +| Chemistry | | Exploring Combinations and Hill Climbing | | | | | | | | | | | | +| 4 | Easy | Single substances | 0.87 | 1.00 | 1.00 | 0.70 | 0.60 | 0.40 | 0.90 | 0.00 | 0.40 | | | +| 5 | Normal | Mix of 3 substances | 0.82 | 0.00 | 0.00 | 0.87 | 0.40 | 0.00 | 0.93 | 0.60 | 0.40 | | | +| 6 | Challenge | Mix of 4 substances | 0.90 | 0.40 | 0.00 | 0.90 | 0.40 | 0.00 | 0.87 | 0.00 | 0.00 | | | +| Archaeology
Correlations | | | | | | | | | | | | | | +| 7 | Easy | Simple instrument | 0.27 | 0.60 | 0.00 | 0.33 | 0.20 | 0.00 | 0.60 | 0.20 | 0.50 | | | +| 8 | Normal | Instrument Use | 0.72 | 0.40 | 0.30 | 0.74 | 0.00 | 0.00 | 0.64 | 0.40 | 0.40 | | | +| 9 | Challenge | Correlation | 0.46 | 0.20 | 0.00 | 0.46 | 0.00 | 0.05 | 0.55 | 0.20 | 0.05 | | | +| | Reactor Lab | Regression | | | | | | | | | | | | +| 10 | Easy | Slope only | 0.42 | 0.00 | 0.40 | 0.44 | 0.00 | 0.10 | 0.38 | 0.00 | 0.20 | | | +| 11 | Normal | Linear regression | 0.44 | 0.00 | 0.20 | 0.49 | 0.00 | 0.00 | 0.51 | 0.00 | 0.00 | | | +| 12 | Challenge | Quadratic regression | 0.43 | 0.00 | 0.20 | 0.39 | 0.00 | 0.00 | 0.39 | 0.00 | 0.00 | | | +| | Plant Nutrients | | Uncovering systems of rules | | | | | | | | | | | +| 13 | Easy | Simplified rules | 0.80 | 0.20 | 0.20 | 0.70 | 0.20 | 0.20 | 0.60 | 0.00 | 0.00 | | | +| 14 | Normal | Presence rules | 0.91 | 0.60 | 0.00 | 0.84 | 0.40 | 0.00 | 0.56 | 0.00 | 0.00 | | | +| 15 | Challenge | Logical Rules | 0.89 | 0.40 | 0.00 | 0.73 | 0.40 | 0.00 | 0.62 | 0.00 | 0.00 | | | +| | Space Sick | Open-ended discovery | | | | | | | | | | | | +| 16 | Easy | Single instrument | 0.78 | 0.60 | 0.00 | 0.68 | 0.40 | 0.10 | 0.80 | 1.00 | 0.60 | | | +| 17 | Normal | Multiple instruments | 0.58 | 0.00 | 0.13 | 0.45 | 0.00 | 0.13 | 0.16 | 0.00 | 0.33 | | | +| 18 | Challenge | Novel instruments | 0.55 | 0.00 | 0.00 | 0.26 | 0.00 | 0.00 | 0.20 | 0.00 | 0.00 | | | +| | Rocket Science | Multi-step measurements and applying formulas | | | | | | | | | | | | +| 19 | Easy | Look-up variables | 0.33 | 0.00 | 0.00 | 0.53 | 0.00 | 0.07 | 0.13 | 0.40 | 0.00 | | | +| 20 | Normal | Measure 2 variables | 0.51 | 0.00 | 0.05 | 0.34 | 0.00 | 0.00 | 0.11 | 0.00 | 0.00 | | | +| 21 | Challenge | Measure 5 variables | 0.43 | 0.00 | 0.00 | 0.15 | 0.00 | 0.00 | 0.22 | 0.00 | 0.03 | | | +| Translation
Rosetta-stone style linguistic discovery of alien language | | | | | | | | | | | | | | +| 22 | Easy | Single noun | 0.40 | 0.40 | 0.20 | 0.30 | 0.00 | 0.00 | 0.20 | 0.20 | 0.00 | | | +| 23 | Normal | Noun and verb | 0.20 | 0.00 | 0.00 | 0.68 | 0.40 | 0.00 | 0.84 | 0.40 | 0.00 | | | +| 24 | Challenge | Noun, adj., and verb | 0.49 | 0.00 | 0.00 | 0.55 | 0.20 | 0.05 | 0.15 | 0.00 | 0.00 | | | +| | Average (Easy) | | | 0.38 | 0.25 | 0.56 | 0.18 | 0.11 | 0.56 | 0.28 | 0.34 | | | +| Average (Normal) | | | 0.59
0.63 | 0.18 | 0.14 | 0.64 | 0.18 | 0.02 | 0.58 | 0.23 | 0.19 | | | +| Average (Challenge) | | | 0.63 | 0.18 | 0.10 | 0.50 | 0.15 | 0.01 | 0.49 | 0.08 | 0.08 | | | +| | | | | | | | | | | | | | | + +Table 5: Baseline model performance on each of the three scoring metrics *(task completion, task process, explanatory knowledge discovery)* across all 10 unit test tasks.Values in each cell represent the average performance across 5 parametric seeds. Unit tests tasks are run to a maximum of 100 steps. + +| | | | ReACT | | Plan+Execute | Hypothesizer | | | +|----|----------------------------------------|-----------|------------|-----------|--------------|--------------|------------|--| +| # | Unit Test Topic | Procedure | Completion | Procedure | Completion | Procedure | Completion | | +| 25 | Multi-turn dialog with an agent | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | | +| 26 | Measure an object with an instrument | 0.87 | 0.60 | 0.73 | 0.40 | 1.00 | 1.00 | | +| 27 | Pick-and-place object | 0.90 | 0.80 | 0.80 | 0.60 | 1.00 | 1.00 | | +| 28 | Pick-and-give object | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | | +| 29 | Read DiscoveryFeed posts | 1.00 | 1.00 | 0.90 | 0.80 | 1.00 | 1.00 | | +| 30 | Move through doors | 0.58 | 0.20 | 0.25 | 0.00 | 0.30 | 0.00 | | +| 31 | Using keys with doors | 0.69 | 0.20 | 0.54 | 0.00 | 0.69 | 0.00 | | +| 32 | Navigate to a specific room in a house | 0.20 | 0.20 | 0.20 | 0.00 | 0.20 | 0.20 | | +| 33 | Search an environment for an object | 0.80 | 0.80 | 0.60 | 0.60 | 1.00 | 1.00 | | +| 34 | Interact with a moving agent | 0.60 | 0.20 | 0.53 | 0.00 | 0.53 | 0.20 | | +| | Average (Unit Tests) | | 0.60 | 0.66 | 0.44 | 0.77 | 0.64 | | + +## 4.2 Baseline Agent Models + +The baseline agents are described below, with model performance on Discovery tasks shown in Table 4, and performance on Unit Tests shown in Table 5. We use the GPT-4O model for all our agents due to its higher performance and lower cost compared to other models. For space we provide \ No newline at end of file diff --git a/olmocr/bench/sample_data/marker/discoverworld_crazy_table4_3.md b/olmocr/bench/sample_data/marker/discoverworld_crazy_table4_3.md new file mode 100644 index 0000000..07356a2 --- /dev/null +++ b/olmocr/bench/sample_data/marker/discoverworld_crazy_table4_3.md @@ -0,0 +1,63 @@ +Table 4: Baseline model performance on each of the three scoring metrics *(task completion, task process, explanatory knowledge discovery)* across all 24 DISCOVERYWORLD tasks. Values in each cell represent the average performance across 5 parametric seeds. *Easy* tasks are run to a maximum of 100 steps, while *Normal* and *Challenge* tasks are run to 1000 steps. + +| | | | ReACT | | | | Plan+Execute | | | Hypothesizer | | | | +|---------------------------------------------------------------------------|-----------------|-----------------------------------------------|-----------------------------|------|-----------|-------------------------|--------------|-------------------------|------|--------------|-----------|--|--| +| | | | Completion
Procedure | | | Completion
Procedure | | Completion
Procedure | | | | | | +| # | Topic | Task | | | Knowledge | | | Knowledge | | | Knowledge | | | +| | Proteomics | Clustering | | | | | | | | | | | | +| 1 | Easy | Simplified Clustering | 0.87 | 0.20 | 0.20 | 0.80 | 0.00 | 0.00 | 0.90 | 0.40 | 1.00 | | | +| 2 | Normal | Clustering (2D) | 0.88 | 0.40 | 0.40 | 0.68 | 0.20 | 0.00 | 0.93 | 0.40 | 0.40 | | | +| 3 | Challenge | Clustering (3D) | 0.88 | 0.40 | 0.60 | 0.58 | 0.20 | 0.00 | 0.93 | 0.40 | 0.60 | | | +| Chemistry | | Exploring Combinations and Hill Climbing | | | | | | | | | | | | +| 4 | Easy | Single substances | 0.87 | 1.00 | 1.00 | 0.70 | 0.60 | 0.40 | 0.90 | 0.00 | 0.40 | | | +| 5 | Normal | Mix of 3 substances | 0.82 | 0.00 | 0.00 | 0.87 | 0.40 | 0.00 | 0.93 | 0.60 | 0.40 | | | +| 6 | Challenge | Mix of 4 substances | 0.90 | 0.40 | 0.00 | 0.90 | 0.40 | 0.00 | 0.87 | 0.00 | 0.00 | | | +| Archaeology
Correlations | | | | | | | | | | | | | | +| 7 | Easy | Simple instrument | 0.27 | 0.60 | 0.00 | 0.33 | 0.20 | 0.00 | 0.60 | 0.20 | 0.50 | | | +| 8 | Normal | Instrument Use | 0.72 | 0.40 | 0.30 | 0.74 | 0.00 | 0.00 | 0.64 | 0.40 | 0.40 | | | +| 9 | Challenge | Correlation | 0.46 | 0.20 | 0.00 | 0.46 | 0.00 | 0.05 | 0.55 | 0.20 | 0.05 | | | +| | Reactor Lab | Regression | | | | | | | | | | | | +| 10 | Easy | Slope only | 0.42 | 0.00 | 0.40 | 0.44 | 0.00 | 0.10 | 0.38 | 0.00 | 0.20 | | | +| 11 | Normal | Linear regression | 0.44 | 0.00 | 0.20 | 0.49 | 0.00 | 0.00 | 0.51 | 0.00 | 0.00 | | | +| 12 | Challenge | Quadratic regression | 0.43 | 0.00 | 0.20 | 0.39 | 0.00 | 0.00 | 0.39 | 0.00 | 0.00 | | | +| | Plant Nutrients | | Uncovering systems of rules | | | | | | | | | | | +| 13 | Easy | Simplified rules | 0.80 | 0.20 | 0.20 | 0.70 | 0.20 | 0.20 | 0.60 | 0.00 | 0.00 | | | +| 14 | Normal | Presence rules | 0.91 | 0.60 | 0.00 | 0.84 | 0.40 | 0.00 | 0.56 | 0.00 | 0.00 | | | +| 15 | Challenge | Logical Rules | 0.89 | 0.40 | 0.00 | 0.73 | 0.40 | 0.00 | 0.62 | 0.00 | 0.00 | | | +| | Space Sick | Open-ended discovery | | | | | | | | | | | | +| 16 | Easy | Single instrument | 0.78 | 0.60 | 0.00 | 0.68 | 0.40 | 0.10 | 0.80 | 1.00 | 0.60 | | | +| 17 | Normal | Multiple instruments | 0.58 | 0.00 | 0.13 | 0.45 | 0.00 | 0.13 | 0.16 | 0.00 | 0.33 | | | +| 18 | Challenge | Novel instruments | 0.55 | 0.00 | 0.00 | 0.26 | 0.00 | 0.00 | 0.20 | 0.00 | 0.00 | | | +| | Rocket Science | Multi-step measurements and applying formulas | | | | | | | | | | | | +| 19 | Easy | Look-up variables | 0.33 | 0.00 | 0.00 | 0.53 | 0.00 | 0.07 | 0.13 | 0.40 | 0.00 | | | +| 20 | Normal | Measure 2 variables | 0.51 | 0.00 | 0.05 | 0.34 | 0.00 | 0.00 | 0.11 | 0.00 | 0.00 | | | +| 21 | Challenge | Measure 5 variables | 0.43 | 0.00 | 0.00 | 0.15 | 0.00 | 0.00 | 0.22 | 0.00 | 0.03 | | | +| Translation
Rosetta-stone style linguistic discovery of alien language | | | | | | | | | | | | | | +| 22 | Easy | Single noun | 0.40 | 0.40 | 0.20 | 0.30 | 0.00 | 0.00 | 0.20 | 0.20 | 0.00 | | | +| 23 | Normal | Noun and verb | 0.20 | 0.00 | 0.00 | 0.68 | 0.40 | 0.00 | 0.84 | 0.40 | 0.00 | | | +| 24 | Challenge | Noun, adj., and verb | 0.49 | 0.00 | 0.00 | 0.55 | 0.20 | 0.05 | 0.15 | 0.00 | 0.00 | | | +| | Average (Easy) | | | 0.38 | 0.25 | 0.56 | 0.18 | 0.11 | 0.56 | 0.28 | 0.34 | | | +| Average (Normal) | | | 0.59
0.63 | 0.18 | 0.14 | 0.64 | 0.18 | 0.02 | 0.58 | 0.23 | 0.19 | | | +| Average (Challenge) | | | 0.63 | 0.18 | 0.10 | 0.50 | 0.15 | 0.01 | 0.49 | 0.08 | 0.08 | | | +| | | | | | | | | | | | | | | + +Table 5: Baseline model performance on each of the three scoring metrics *(task completion, task process, explanatory knowledge discovery)* across all 10 unit test tasks.Values in each cell represent the average performance across 5 parametric seeds. Unit tests tasks are run to a maximum of 100 steps. + +| | | | ReACT | | Plan+Execute | Hypothesizer | | | +|----|----------------------------------------|-----------|------------|-----------|--------------|--------------|------------|--| +| # | Unit Test Topic | Procedure | Completion | Procedure | Completion | Procedure | Completion | | +| 25 | Multi-turn dialog with an agent | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | | +| 26 | Measure an object with an instrument | 0.87 | 0.60 | 0.73 | 0.40 | 1.00 | 1.00 | | +| 27 | Pick-and-place object | 0.90 | 0.80 | 0.80 | 0.60 | 1.00 | 1.00 | | +| 28 | Pick-and-give object | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | | +| 29 | Read DiscoveryFeed posts | 1.00 | 1.00 | 0.90 | 0.80 | 1.00 | 1.00 | | +| 30 | Move through doors | 0.58 | 0.20 | 0.25 | 0.00 | 0.30 | 0.00 | | +| 31 | Using keys with doors | 0.69 | 0.20 | 0.54 | 0.00 | 0.69 | 0.00 | | +| 32 | Navigate to a specific room in a house | 0.20 | 0.20 | 0.20 | 0.00 | 0.20 | 0.20 | | +| 33 | Search an environment for an object | 0.80 | 0.80 | 0.60 | 0.60 | 1.00 | 1.00 | | +| 34 | Interact with a moving agent | 0.60 | 0.20 | 0.53 | 0.00 | 0.53 | 0.20 | | +| | Average (Unit Tests) | | 0.60 | 0.66 | 0.44 | 0.77 | 0.64 | | + +## 4.2 Baseline Agent Models + +The baseline agents are described below, with model performance on Discovery tasks shown in Table 4, and performance on Unit Tests shown in Table 5. We use the GPT-4O model for all our agents due to its higher performance and lower cost compared to other models. For space we provide \ No newline at end of file diff --git a/olmocr/bench/sample_data/marker/lincoln_letter_1.md b/olmocr/bench/sample_data/marker/lincoln_letter_1.md new file mode 100644 index 0000000..d953e7d --- /dev/null +++ b/olmocr/bench/sample_data/marker/lincoln_letter_1.md @@ -0,0 +1,3 @@ +necuhve Mansion Vastington amany layor Seneral Hitchcocks Commissioner of Cachanges, is anthonged and directed to offer Bingadier General Trin prisoner of war in Fort Inctienny, in exchange now w Major White, who is held as a preises at Richmond Ite is also directed to vand forwards the offer of exchange by Stenny in. Warfield, Eag. of Baltimore, under aflag 11 mice, and give him apass to tity Point. Abrakan Sincolus + +![](_page_0_Picture_1.jpeg) \ No newline at end of file diff --git a/olmocr/bench/sample_data/marker/mattsnotes_1.md b/olmocr/bench/sample_data/marker/mattsnotes_1.md new file mode 100644 index 0000000..7ec4df5 --- /dev/null +++ b/olmocr/bench/sample_data/marker/mattsnotes_1.md @@ -0,0 +1,5 @@ +February Flow Data Components Code The stack V2 Codetext SE whatever we've scraped Webtext HQOCLM DATA MIXES 85 Source code Deepseek 0 Codetext cider 5 Webtext 85 The stack V2 1590 Cedetext Jstaceder 2 n 0 webtext loose source code Arctic + +P1 1090 Source code Granite P2 80 code 20 language Code Data Recipe staceder 1 Order by Repo 2 call Heristic filters 3 Group by Reporting minhash 4 Pack into Repo level does Δ 5 Select PL's Δ i D Pack into FIM tokens X Eng Done not critical Eng definitively NOT done D so so easy use Preprocessed codetext web text + +ARCH TRAINING Pick Arch like OLMO 18 or replicate a 30 model Follow standard LR flow Eval Hacky nonsense for now \ No newline at end of file diff --git a/olmocr/bench/sample_data/marker/multi_column_miss.md b/olmocr/bench/sample_data/marker/multi_column_miss_1.md similarity index 100% rename from olmocr/bench/sample_data/marker/multi_column_miss.md rename to olmocr/bench/sample_data/marker/multi_column_miss_1.md diff --git a/olmocr/bench/sample_data/marker/multi_column_miss_2.md b/olmocr/bench/sample_data/marker/multi_column_miss_2.md new file mode 100644 index 0000000..75460de --- /dev/null +++ b/olmocr/bench/sample_data/marker/multi_column_miss_2.md @@ -0,0 +1,19 @@ +Advocacy in Action 447 + +stakeholders has occurred in other nations, with groups and individuals refusing to risk being appropriated into the industry's public relations ambitions. It now looks like that with vigilance, toa realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company's deliberations on the matter, and the company's perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +........................................................................... + +Correspondence to: Dr Norbert Hirschhorn, Nastolantie 6, A3 00600 Helsinki, Finland; bertzpoet@yahoo.com + +....................... + +Received 13 November 2003 Accepted 15 July 2004 ....................... Over the past three decades increasing pressure from non-governmental organisations (NGOs), governments and the United Nations, has required transnational corporations (TNCs) to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as ''corporate social responsibility'' (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to its own version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity along standards of business ethics, or as an irretrievably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +## CORPORATE SOCIAL RESPONSIBILITY: THE CONTEXT + +The term ''corporate social responsibility'' is in vogue at the moment but as a concept it is vague and means different things to different people.1 + +Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of ''noblesse oblige''. But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century.2 3 The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of + +Abbreviations: ASH, Action on Smoking and Health; BAT, British American Tobacco; CERES, Coalition for Environmentally Responsible Economies; CSR, corporate social responsibility; DJSI, Dow Jones Sustainability Index; GCAC, Global Corporate Affairs Council; GRI, Global Reporting Initiative; MSA, Master Settlement Agreement; NGOs, non-governmental organisations; PM, Philip Morris; TNCs, transnational corporations; UNEP, United Nations Environment Program \ No newline at end of file diff --git a/olmocr/bench/sample_data/marker/multi_column_miss_3.md b/olmocr/bench/sample_data/marker/multi_column_miss_3.md new file mode 100644 index 0000000..4fb2c9b --- /dev/null +++ b/olmocr/bench/sample_data/marker/multi_column_miss_3.md @@ -0,0 +1,21 @@ +Advocacy in Action 447 + +stakeholders has occurred in other nations, with groups and individuals refusing to risk being appropriated into the industry's public relations ambitions. It now looks like that with vigilance, tobacco control advocates can easily foment similar distaste in many areas of the business community. Our actions sought to denormalise the tobacco industry by disrupting its efforts to take its place alongside other industries—often with considerable social credit—in the hope that it might gain by association. + +Tobacco industry posturing about its corporate responsibility can never hide the ugly consequences of its ongoing efforts to ''work with all relevant stakeholders for the preservation of opportunities for informed adults to consume tobacco products''1 (tranehaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +........................................................................... + +Correspondence to: Dr Norbert Hirschhorn, Nastolantie 6, A3 00600 Helsinki, Finland; bertzpoet@yahoo.com + +....................... + +Received 13 November 2003 Accepted 15 July 2004 ....................... Over the past three decades increasing pressure from non-governmental organisations (NGOs), governments and the United Nations, has required transnational corporations (TNCs) to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as ''corporate social responsibility'' (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to its own version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity along standards of business ethics, or as an irretrievably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +## CORPORATE SOCIAL RESPONSIBILITY: THE CONTEXT + +The term ''corporate social responsibility'' is in vogue at the moment but as a concept it is vague and means different things to different people.1 + +Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of ''noblesse oblige''. But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century.2 3 The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of + +Abbreviations: ASH, Action on Smoking and Health; BAT, British American Tobacco; CERES, Coalition for Environmentally Responsible Economies; CSR, corporate social responsibility; DJSI, Dow Jones Sustainability Index; GCAC, Global Corporate Affairs Council; GRI, Global Reporting Initiative; MSA, Master Settlement Agreement; NGOs, non-governmental organisations; PM, Philip Morris; TNCs, transnational corporations; UNEP, United Nations Environment Program \ No newline at end of file diff --git a/olmocr/bench/sample_data/marker/olmo2-pg4_1.md b/olmocr/bench/sample_data/marker/olmo2-pg4_1.md new file mode 100644 index 0000000..7b2bb42 --- /dev/null +++ b/olmocr/bench/sample_data/marker/olmo2-pg4_1.md @@ -0,0 +1,25 @@ +| Source | Type | Tokens | Words | Bytes | Docs | +|-------------------------------------------------|------------------|--------|-------|--------|-------| +| Pretraining ✦
OLMo 2 1124 Mix | | | | | | +| DCLM-Baseline | Web pages | 3.71T | 3.32T | 21.32T | 2.95B | +| StarCoder
filtered version
from OLMoE Mix | Code | 83.0B | 70.0B | 459B | 78.7M | +| peS2o
from Dolma 1.7 | Academic papers | 58.6B | 51.1B | 413B | 38.8M | +| arXiv | STEM papers | 20.8B | 19.3B | 77.2B | 3.95M | +| OpenWebMath | Math web pages | 12.2B | 11.1B | 47.2B | 2.89M | +| Algebraic Stack | Math proofs code | 11.8B | 10.8B | 44.0B | 2.83M | +| Wikipedia & Wikibooks
from Dolma 1.7 | Encyclopedic | 3.7B | 3.16B | 16.2B | 6.17M | +| Total | | 3.90T | 3.48T | 22.38T | 3.08B | + +**Table 1 Composition of the pretraining data for OLMo 2**. The OLMo 2 1124 Mix is composed of StarCoder (Li et al., 2023b; Kocetkov et al., 2022), peS2o (Soldaini and Lo, 2023), web text from DCLM (Li et al., 2024) and Wiki come from Dolma 1.7 (Soldaini et al., 2024). arXiv comes from Red-Pajama (Together AI, 2023), while OpenWebMath (Paster et al., 2023) and Algebraic Stack come from ProofPile II (Azerbayev et al., 2023). + +## **2.1.1 Pretraining data: OLMo 2 Mix 1124** + +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over 95% derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data used in OLMoE (Muennighoff et al., 2024). + +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use the "baseline 1.0 " mix.4 From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., 2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). + +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection of this source, we found it to contain documents encoded in binary format or containing mostly numerical content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the document, or whose top-2 most frequent words constitute over 50% of the document. To mitigate possible training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details and show effectiveness of this intervention in Section §3.1. + +## **2.1.2 Mid-training data: Dolmino Mix 1124** + +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide focused exposure to STEM references and high quality text. We generate several variants of this mixture, with varying sizes, but generally refer to this mixture as Dolmino Mix 1124. The base sources from which Dolmino Mix 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep dive detailing our processes for experimenting and curating data for this mix. \ No newline at end of file diff --git a/olmocr/bench/sample_data/marker/openstax_caculus_pg_273_1.md b/olmocr/bench/sample_data/marker/openstax_caculus_pg_273_1.md new file mode 100644 index 0000000..c783867 --- /dev/null +++ b/olmocr/bench/sample_data/marker/openstax_caculus_pg_273_1.md @@ -0,0 +1,58 @@ +## **3.4 EXERCISES** + +For the following exercises, the given functions represent the position of a particle traveling along a horizontal line. + +- a. Find the velocity and acceleration functions. +- b. Determine the time intervals when the object is slowing down or speeding up. + +$$150. \quad s(t) = 2t^3 - 3t^2 - 12t + 8$$ + +$$151. \quad s(t) = 2t^3 - 15t^2 + 36t - 10t$$ + +$$152. \quad s(t) = \frac{t}{1+t^2}$$ + +153. A rocket is fired vertically upward from the ground. The distance *s* in feet that the rocket travels from the ground after *t* seconds is given by *s*(*t*) = −16*t* 2 + 560*t*. + +- a. Find the velocity of the rocket 3 seconds after being fired. +- b. Find the acceleration of the rocket 3 seconds after being fired. + +154. A ball is thrown downward with a speed of 8 ft/ s from the top of a 64-foot-tall building. After *t* seconds, its height above the ground is given by *s*(*t*) = −16*t* 2 − 8*t* + 64. + +- a. Determine how long it takes for the ball to hit the ground. +- b. Determine the velocity of the ball when it hits the ground. + +155. The position function *s*(*t*) = *t* 2 − 3*t* − 4 represents the position of the back of a car backing out of a driveway and then driving in a straight line, where *s* is in feet and *t* is in seconds. In this case, *s*(*t*) = 0 represents the time at which the back of the car is at the garage door, so *s*(0) = −4 is the starting position of the car, 4 feet inside the garage. + +- a. Determine the velocity of the car when *s*(*t*) = 0. +- b. Determine the velocity of the car when *s*(*t*) = 14. + +156. The position of a hummingbird flying along a straight line in *t* seconds is given by *s*(*t*) = 3*t* 3 − 7*t* meters. + +- a. Determine the velocity of the bird at *t* = 1 sec. +- b. Determine the acceleration of the bird at *t* = 1 sec. +- c. Determine the acceleration of the bird when the velocity equals 0. + +157. A potato is launched vertically upward with an initial velocity of 100 ft/s from a potato gun at the top of an 85-foot-tall building. The distance in feet that the potato travels from the ground after *t* seconds is given by + +*s*(*t*) = −16*t* 2 + 100*t* + 85. + +- a. Find the velocity of the potato after 0.5 s and 5.75 s. +- b. Find the speed of the potato at 0.5 s and 5.75 s. +- c. Determine when the potato reaches its maximum height. +- d. Find the acceleration of the potato at 0.5 s and 1.5 s. +- e. Determine how long the potato is in the air. +- f. Determine the velocity of the potato upon hitting the ground. + +158. The position function *s*(*t*) = *t* 3 − 8*t* gives the position in miles of a freight train where east is the positive direction and *t* is measured in hours. + +- a. Determine the direction the train is traveling when *s*(*t*) = 0. +- b. Determine the direction the train is traveling when *a*(*t*) = 0. +- c. Determine the time intervals when the train is slowing down or speeding up. + +159. The following graph shows the position *y* = *s*(*t*) of an object moving along a straight line. + +![](_page_0_Figure_34.jpeg) + +- negative, or zero. b. Sketch the graph of the velocity function. +- c. Use the graph of the velocity function to determine the time intervals when the acceleration is positive, negative, or zero. +- d. Determine the time intervals when the object is speeding up or slowing down. \ No newline at end of file diff --git a/olmocr/bench/sample_data/mineru/discoverworld_crazy_table4.md b/olmocr/bench/sample_data/mineru/discoverworld_crazy_table4_1.md similarity index 100% rename from olmocr/bench/sample_data/mineru/discoverworld_crazy_table4.md rename to olmocr/bench/sample_data/mineru/discoverworld_crazy_table4_1.md diff --git a/olmocr/bench/sample_data/mineru/lincoln_letter_1.md b/olmocr/bench/sample_data/mineru/lincoln_letter_1.md new file mode 100644 index 0000000..d67137e --- /dev/null +++ b/olmocr/bench/sample_data/mineru/lincoln_letter_1.md @@ -0,0 +1 @@ +![](tmpgz41xbv8/92aad94c4fc9c5b80db131bf1f9dfacb1f43a27b1620e89dd78f5b225dcfd6f9.jpg) \ No newline at end of file diff --git a/olmocr/bench/sample_data/mineru/mattsnotes_1.md b/olmocr/bench/sample_data/mineru/mattsnotes_1.md new file mode 100644 index 0000000..3b8a68e --- /dev/null +++ b/olmocr/bench/sample_data/mineru/mattsnotes_1.md @@ -0,0 +1,13 @@ +![](tmpvc9u9f45/931edd4f8177771a0cbfbe983ca5c1e35c7971ccb4336c337b78a0fab9d15801.jpg) + +![](tmpvc9u9f45/85cebc5d7bc37a1eb140233e856278039bfec714487f664cfcd6804ca9e16532.jpg) + +![](tmpvc9u9f45/bb608c0041f8f724353c4d7c95a4384c344e6926f07c38c76a503e030c73e8cd.jpg) + +![](tmpvc9u9f45/82e1d6d688ef85a33d4077529ce0b8729a172074de68011ad9c3105e1f8a39e1.jpg) + +![](tmpvc9u9f45/dedbeed09f2078a5d4d4e8b217d8ae117198231f5e53b223ac34280af8f03c94.jpg) + +![](tmpvc9u9f45/27d3b5cb772e24e202d5344349c5acf19b1253c2f6f2b4f2ca398b6993b91d25.jpg) + +![](tmpvc9u9f45/20b196376219aaeb4d913dbdc6a8118f650a9e0264b314cd2a155372e1b530a7.jpg) \ No newline at end of file diff --git a/olmocr/bench/sample_data/mineru/multi_column_miss.md b/olmocr/bench/sample_data/mineru/multi_column_miss_1.md similarity index 100% rename from olmocr/bench/sample_data/mineru/multi_column_miss.md rename to olmocr/bench/sample_data/mineru/multi_column_miss_1.md diff --git a/olmocr/bench/sample_data/mineru/olmo2-pg4_1.md b/olmocr/bench/sample_data/mineru/olmo2-pg4_1.md new file mode 100644 index 0000000..a2d2584 --- /dev/null +++ b/olmocr/bench/sample_data/mineru/olmo2-pg4_1.md @@ -0,0 +1,13 @@ +
SourceTypeTokensWordsBytesDocs
Pretraining ← OLMo 2 1124 Mix
DCLM-BaselineWeb pages3.71T3.32T21.32T2.95B
StarCoder filtered version from OLMoE MixCode83.0B70.0B459B78.7M
peS2o from Dolma 1.7Academicpapers58.6B51.1B413B38.8M
arXivSTEM papers20.8B19.3B77.2B3.95M
OpenWebMathMath web pages12.2B11.1B47.2B2.89M
Algebraic StackMath proofs code11.8B10.8B44.0B2.83M
Wikipedia & Wikibooks from Dolma 1.7Encyclopedic3.7B3.16B16.2B6.17M
Total3.90T3.48T22.38T3.08B
+ +# 2.1.1 Pretraining data: OLMo 2 Mix 1124 + +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over $95\%$ derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data used in OLMoE (Muennighoff et al., 2024). + +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use the “baseline 1.0 ” mix.4 From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., 2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). + +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection of this source, we found it to contain documents encoded in binary format or containing mostly numerical content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the document, or whose top-2 most frequent words constitute over $50\%$ of the document. To mitigate possible training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details and show effectiveness of this intervention in Section §3.1. + +# 2.1.2 Mid-training data: Dolmino Mix 1124 + +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide focused exposure to STEM references and high quality text. We generate several variants of this mixture, with varying sizes, but generally refer to this mixture as Dolmino Mix 1124. The base sources from which Dolmino Mix 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep dive detailing our processes for experimenting and curating data for this mix. \ No newline at end of file diff --git a/olmocr/bench/sample_data/mineru/openstax_caculus_pg_273_1.md b/olmocr/bench/sample_data/mineru/openstax_caculus_pg_273_1.md new file mode 100644 index 0000000..1503e99 --- /dev/null +++ b/olmocr/bench/sample_data/mineru/openstax_caculus_pg_273_1.md @@ -0,0 +1,52 @@ +# 3.4 EXERCISES + +For the following exercises, the given functions represent the position of a particle traveling along a horizontal line. + +a. Find the velocity and acceleration functions. b. Determine the time intervals when the object is slowing down or speeding up. + +150. $s(t)=2t^{3}-3t^{2}-12t+8$ +151. $s(t)=2t^{3}-15t^{2}+36t-10$ +152. $s(t)=\frac{t}{1+t^{2}}$ + +153. A rocket is fired vertically upward from the ground. The distance $s$ in feet that the rocket travels from the ground after $t$ seconds is given by $s(t)=-16t^{2}+560t,$ . + +a. Find the velocity of the rocket 3 seconds after being fired. +b. Find the acceleration of the rocket 3 seconds after being fired. + +154. A ball is thrown downward with a speed of 8 ft/ s from the top of a 64-foot-tall building. After $t$ seconds, its height above the ground is given by $s(t)=-16t^{2}-8t+64.$ . + +a. Determine how long it takes for the ball to hit the ground. +b. Determine the velocity of the ball when it hits the ground. + +155. The position function $s(t)=t^{2}-3t-4$ represents the position of the back of a car backing out of a driveway and then driving in a straight line, where $s$ is in feet and $t$ is in seconds. In this case, $s(t)=0$ represents the time at which the back of the car is at the garage door, so $s(0)=-4$ is the starting position of the car, 4 feet inside the garage. + +a. Determine the velocity of the car when $s(t)=0$ . +b. Determine the velocity of the car when $s(t)=14$ . + +156. The position of a hummingbird flying along a straight line in $t$ seconds is given by $s(t)=3t^{3}-7t$ meters. + +a. Determine the velocity of the bird at $t=1$ sec. b. Determine the acceleration of the bird at $t=1$ sec. c. Determine the acceleration of the bird when the velocity equals 0. + +157. A potato is launched vertically upward with an initial velocity of 100 ft/s from a potato gun at the top of an 85-foot-tall building. The distance in feet that the potato travels from the ground after $t$ seconds is given by $s(t)=-16t^{2}+100t+85.$ . + +a. Find the velocity of the potato after $0.5\:\mathrm{s}$ and $5.75s$ . +b. Find the speed of the potato at $0.5s$ and $5.75s$ . +c. Determine when the potato reaches its maximum height. +d. Find the acceleration of the potato at 0.5 s and 1.5 s. +e. Determine how long the potato is in the air. +f. Determine the velocity of the potato upon hitting the ground. + +158. The position function $s(t)=t^{3}-8t$ gives the position in miles of a freight train where east is the positive direction and $t$ is measured in hours. + +a. Determine the direction the train is traveling when $s(t)=0$ . +b. Determine the direction the train is traveling when $a(t)=0$ . +c. Determine the time intervals when the train is slowing down or speeding up. + +159. The following graph shows the position $y=s(t)$ of an object moving along a straight line. + +![](tmpajaekj0s/208dd5f404fd99b27696f09a5f4ceb0dffdf86f4e3594a872c99afa173c80bf8.jpg) + +a. Use the graph of the position function to determine the time intervals when the velocity is positive, negative, or zero. +b. Sketch the graph of the velocity function. +c. Use the graph of the velocity function to determine the time intervals when the acceleration is positive, negative, or zero. +d. Determine the time intervals when the object is speeding up or slowing down. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4.md b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4.md deleted file mode 100644 index c23aff5..0000000 --- a/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4.md +++ /dev/null @@ -1,52 +0,0 @@ -Table 4: Baseline model performance on each of the three scoring metrics (task completion, task process, explanatory knowledge discovery) across all 24 DISCOVERY WORLD tasks. Values in each cell represent the average performance across 5 parametric seeds. Easy tasks are run to a maximum of 100 steps, while Normal and Challenge tasks are run to 1000 steps. - -| # | Topic | Task | ReACT | Plan+Execute | Hypothesizer | -|---|-----------------|-----------------------|-----------|--------------|--------------| -| | | | Pressure | Completion | Knowledge | Pressure | Completion | Knowledge | -| 1 | Proteomics | Clustering | 0.87 | 0.20 | 0.20 | 0.80 | 0.00 | 0.00 | 0.90 | 0.40 | 1.00 | -| 2 | Chemistry | Exploring Combinations and Hill Climbing | 0.89 | 0.40 | 0.00 | 0.89 | 0.20 | 0.00 | 0.95 | 0.40 | 0.60 | -| 3 | Archaeology | Correlations | 0.90 | 0.40 | 0.00 | 0.90 | 0.40 | 0.00 | 0.95 | 0.60 | 0.40 | -| 4 | Reactor Lab | Regression | 0.91 | 0.60 | 0.00 | 0.94 | 0.40 | 0.00 | 0.87 | 0.00 | 0.00 | -| 5 | Plant Nutrients | Uncovering systems of rules | 0.91 | 0.40 | 0.00 | 0.91 | 0.40 | 0.00 | 0.87 | 0.00 | 0.00 | -| 6 | Space Sick | Open-ended discovery | 0.78 | 0.60 | 0.00 | 0.78 | 0.40 | 0.10 | 0.80 | 1.00 | 0.60 | -| 7 | Archaeology | Correlations | 0.89 | 0.40 | 0.00 | 0.90 | 0.40 | 0.00 | 0.55 | 0.20 | 0.03 | -| 8 | Plant Nutrients | Uncovering systems of rules | 0.91 | 0.60 | 0.00 | 0.91 | 0.40 | 0.00 | 0.55 | 0.20 | 0.03 | -| 9 | Space Sick | Open-ended discovery | 0.78 | 0.60 | 0.00 | 0.78 | 0.40 | 0.10 | 0.80 | 1.00 | 0.60 | -| 10| Easy | Simplified Clustering | 0.42 | 0.00 | 0.40 | 0.44 | 0.00 | 0.10 | 0.38 | 0.00 | 0.20 | -| 11| Normal | Linear regression | 0.44 | 0.00 | 0.20 | 0.49 | 0.00 | 0.00 | 0.51 | 0.00 | 0.00 | -| 12| Challenge | Quadratic regression | 0.43 | 0.00 | 0.20 | 0.39 | 0.00 | 0.00 | 0.39 | 0.00 | 0.00 | -| 13| Easy | Simplified Clustering | 0.80 | 0.20 | 0.20 | 0.70 | 0.20 | 0.20 | 0.60 | 0.00 | 0.00 | -| 14| Normal | Presence rules | 0.91 | 0.60 | 0.00 | 0.84 | 0.40 | 0.00 | 0.56 | 0.00 | 0.00 | -| 15| Challenge | Logical Rules | 0.89 | 0.40 | 0.00 | 0.73 | 0.40 | 0.00 | 0.62 | 0.00 | 0.00 | -| 16| Easy | Single instrument | 0.78 | 0.60 | 0.00 | 0.68 | 0.40 | 0.10 | 0.80 | 1.00 | 0.60 | -| 17| Normal | Multiple instruments | 0.58 | 0.00 | 0.13 | 0.45 | 0.00 | 0.13 | 0.16 | 0.00 | 0.33 | -| 18| Challenge | Novel instruments | 0.55 | 0.00 | 0.00 | 0.26 | 0.00 | 0.00 | 0.20 | 0.00 | 0.00 | -| 19| Easy | Look-up variables | 0.33 | 0.00 | 0.00 | 0.53 | 0.00 | 0.07 | 0.13 | 0.40 | 0.00 | -| 20| Normal | Measure 2 variables | 0.51 | 0.00 | 0.05 | 0.34 | 0.00 | 0.00 | 0.11 | 0.00 | 0.00 | -| 21| Challenge | Measure 5 variables | 0.43 | 0.00 | 0.00 | 0.15 | 0.00 | 0.00 | 0.22 | 0.00 | 0.03 | -| 22| Easy | Single noun | 0.40 | 0.40 | 0.20 | 0.30 | 0.00 | 0.00 | 0.20 | 0.20 | 0.00 | -| 23| Normal | Noun and verb | 0.20 | 0.00 | 0.00 | 0.68 | 0.40 | 0.00 | 0.54 | 0.40 | 0.00 | -| 24| Challenge | Noun, adj., and verb | 0.49 | 0.00 | 0.00 | 0.55 | 0.20 | 0.05 | 0.15 | 0.00 | 0.00 | -| | Average (Easy) | | 0.59 | 0.38 | 0.25 | 0.56 | 0.18 | 0.11 | 0.56 | 0.28 | 0.34 | -| | Average (Normal)| | 0.63 | 0.18 | 0.14 | 0.64 | 0.18 | 0.02 | 0.58 | 0.23 | 0.19 | -| | Average (Challenge) | | 0.63 | 0.18 | 0.10 | 0.50 | 0.15 | 0.01 | 0.49 | 0.08 | 0.08 | - -Table 5: Baseline model performance on each of the three scoring metrics (task completion, task process, explanatory knowledge discovery) across all 10 unit test tasks. Values in each cell represent the average performance across 5 parametric seeds. Unit tests tasks are run to a maximum of 100 steps. - -| # | Unit Test Topic | ReACT | Plan+Execute | Hypothesizer | -|---|-----------------|-------|--------------|--------------| -| | | Pressure | Completion | Knowledge | Pressure | Completion | Knowledge | Pressure | Completion | Knowledge | -| 25| Multi-turn dialog with an agent | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | -| 26| Measure an object with an instrument | 0.87 | 0.60 | 0.73 | 0.40 | 1.00 | 1.00 | -| 27| Pick-and-place object | 0.90 | 0.80 | 0.80 | 0.60 | 1.00 | 1.00 | -| 28| Read Discovery/Feed posts | 1.00 | 1.00 | 0.90 | 0.80 | 1.00 | 1.00 | -| 29| Move through doors | 0.58 | 0.20 | 0.25 | 0.00 | 0.30 | 0.00 | -| 30| Using keys with doors | 0.69 | 0.20 | 0.54 | 0.00 | 0.69 | 0.00 | -| 31| Navigate to a specific room in a house | 0.20 | 0.20 | 0.20 | 0.00 | 0.20 | 0.20 | -| 32| Search an environment for an object | 0.80 | 0.80 | 0.60 | 0.60 | 1.00 | 1.00 | -| 33| Interact with a moving agent | 0.60 | 0.20 | 0.53 | 0.00 | 0.53 | 0.20 | -| | Average (Unit Tests) | 0.76 | 0.60 | 0.66 | 0.44 | 0.77 | 0.64 | - -4.2 Baseline Agent Models - -The baseline agents are described below, with model performance on Discovery tasks shown in Table 4, and performance on Unit Tests shown in Table 5. We use the GPT-4G model for all our agents due to its higher performance and lower cost compared to other models. For space we provide \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_1.md b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_1.md new file mode 100644 index 0000000..318bd7d --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_1.md @@ -0,0 +1 @@ +Error: JSONDecodeError - Unterminated string starting at: line 1 column 125 (char 124) \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_2.md b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_2.md new file mode 100644 index 0000000..46456f8 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_2.md @@ -0,0 +1 @@ +Error: JSONDecodeError - Unterminated string starting at: line 1 column 126 (char 125) \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_3.md b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_3.md new file mode 100644 index 0000000..46456f8 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_3.md @@ -0,0 +1 @@ +Error: JSONDecodeError - Unterminated string starting at: line 1 column 126 (char 125) \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_4.md b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_4.md new file mode 100644 index 0000000..46456f8 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_4.md @@ -0,0 +1 @@ +Error: JSONDecodeError - Unterminated string starting at: line 1 column 126 (char 125) \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_5.md b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_5.md new file mode 100644 index 0000000..108bece --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/discoverworld_crazy_table4_5.md @@ -0,0 +1,50 @@ +Table 4: Baseline model performance on each of the three scoring metrics (task completion, task process, explanatory knowledge discovery) across all 24 DISCOVERY WORLD tasks. Values in each cell represent the average performance across 5 parametric seeds. Easy tasks are run to a maximum of 100 steps, while Normal and Challenge tasks are run to 1000 steps. + +| # | Topic | Task | ReACT Completion | Plan+Execute Completion | Hypothesizer Completion | +|---|----------------------------|---------------------------|------------------|-------------------------|-------------------------| +| 1 | Proteomics | Clustering | 0.87 0.20 0.20 | 0.80 0.00 0.00 | 0.90 0.40 1.00 | +| 2 | Normal | Clustering (2D) | 0.88 0.40 0.40 | 0.68 0.20 0.00 | 0.93 0.40 0.40 | +| 3 | Easy | Clustering (3D) | 0.88 0.40 0.60 | 0.55 0.20 0.00 | 0.93 0.40 0.60 | +| 4 | Chemistry | Exploring Combinations | 0.87 1.00 1.00 | 0.70 0.60 0.40 | 0.90 0.40 0.40 | +| 5 | Normal | Single substances | 0.82 0.00 0.00 | 0.87 0.40 0.00 | 0.93 0.40 0.40 | +| 6 | Challenge | Mix of 4 substances | 0.90 0.40 0.00 | 0.90 0.40 0.00 | 0.97 0.00 0.00 | +| 7 | Archaeology | Correlations | 0.27 0.60 0.00 | 0.33 0.20 0.00 | 0.60 0.20 0.50 | +| 8 | Easy | Simple instrument | 0.72 0.40 0.30 | 0.74 0.00 0.00 | 0.64 0.40 0.40 | +| 9 | Challenge | Correlation | 0.46 0.20 0.00 | 0.46 0.00 0.05 | 0.55 0.20 0.05 | +| 10 | Reactor Lab | Regression | 0.42 0.00 0.40 | 0.44 0.00 0.10 | 0.38 0.00 0.20 | +| 11 | Normal | Linear regression | 0.44 0.00 0.20 | 0.49 0.00 0.00 | 0.51 0.00 0.00 | +| 12 | Challenge | Quadratic regression | 0.43 0.00 0.20 | 0.39 0.00 0.00 | 0.39 0.00 0.00 | +| 13 | Normal | Simple rules | 0.91 0.60 0.00 | 0.84 0.40 0.00 | 0.56 0.40 0.00 | +| 14 | Challenge | Logical Rules | 0.89 0.40 0.00 | 0.73 0.40 0.00 | 0.62 0.00 0.00 | +| 15 | Normal | Uncovering systems of rules | 0.80 0.20 0.20 | 0.70 0.20 0.20 | 0.60 0.00 0.00 | +| 16 | Challenge | Quadratic regression | 0.43 0.00 0.20 | 0.39 0.00 0.00 | 0.39 0.00 0.00 | +| 17 | Normal | Presence rules | 0.55 0.00 0.00 | 0.26 0.00 0.00 | 0.20 0.00 0.00 | +| 18 | Challenge | Novel instruments | 0.58 0.00 0.13 | 0.45 0.00 0.13 | 0.16 0.00 0.33 | +| 19 | Normal | Multi-step measurements | 0.55 0.00 0.00 | 0.34 0.00 0.00 | 0.11 0.00 0.00 | +| 20 | Challenge | Applying formulas | 0.51 0.00 0.05 | 0.51 0.00 0.05 | 0.22 0.00 0.03 | +| 21 | Normal | Look-up variables | 0.43 0.00 0.00 | 0.33 0.00 0.00 | 0.20 0.20 0.00 | +| 22 | Challenge | Multiple instruments | 0.55 0.00 0.00 | 0.34 0.00 0.00 | 0.11 0.00 0.00 | +| 23 | Normal | Novel instruments | 0.55 0.00 0.00 | 0.26 0.00 0.00 | 0.20 0.00 0.00 | +| 24 | Challenge | Novel instruments | 0.55 0.00 0.00 | 0.26 0.00 0.00 | 0.20 0.00 0.00 | +| 25 | Average (Easy) | | 0.59 0.38 0.25 | 0.56 0.18 0.11 | 0.56 0.28 0.34 | +| 26 | Average (Normal) | | 0.63 0.18 0.14 | 0.64 0.18 0.02 | 0.58 0.23 0.19 | +| 27 | Average (Challenge) | | 0.63 0.18 0.10 | 0.50 0.15 0.01 | 0.49 0.08 0.08 | + +Table 5: Baseline model performance on each of the three scoring metrics (task completion, task process, explanatory knowledge discovery) across all 10 unit test tasks. Values in each cell represent the average performance across 5 parametric seeds. Unit tests tasks are run to a maximum of 100 steps. + +| # | Unit Test Topic | ReACT Completion | Plan+Execute Completion | Hypothesizer Completion | +|---|------------------------------------------------------|------------------|-------------------------|-------------------------| +| 25 | Multi-turn dialog with an agent | 1.00 1.00 1.00 | 1.00 1.00 1.00 | 1.00 1.00 1.00 | +| 26 | Measure an object with an instrument | 0.87 0.60 0.73 | 0.40 0.00 0.00 | 1.00 1.00 1.00 | +| 27 | Pick-and-place object | 0.90 0.80 0.80 | 0.80 0.60 0.60 | 1.00 1.00 1.00 | +| 28 | Read DiscoveryFeed posts | 1.00 1.00 1.00 | 0.90 0.80 0.80 | 1.00 1.00 1.00 | +| 29 | Move through doors | 0.58 0.20 0.67 | 0.25 0.00 0.00 | 0.30 0.00 0.00 | +| 30 | Using keys with doors | 0.67 0.20 0.53 | 0.00 0.00 0.00 | 0.69 0.00 0.00 | +| 31 | Navigate to a specific room in a house | 0.20 0.20 0.20 | 0.20 0.00 0.00 | 0.20 0.20 0.20 | +| 32 | Search an environment for an object | 0.80 0.80 0.80 | 0.60 0.60 0.60 | 1.00 1.00 1.00 | +| 33 | Interact with a moving agent | 0.60 0.20 0.53 | 0.00 0.00 0.00 | 0.53 0.20 0.20 | +| 34 | Average (Unit Tests) | 0.76 0.60 0.66 | 0.44 0.44 0.44 | 0.77 0.64 0.64 | + +4.2 Baseline Agent Models + +The baseline agents are described below, with model performance on Discovery tasks shown in Table 4, and performance on Unit Tests shown in Table 5. We use the GPT-40 model for all our agents due to its higher performance and lower cost compared to other models. For space we provide... \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/lincoln_letter_1.md b/olmocr/bench/sample_data/olmocr/lincoln_letter_1.md new file mode 100644 index 0000000..6c1dd7f --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/lincoln_letter_1.md @@ -0,0 +1,9 @@ +Executive Mansion, + +Washington City, + +January 15th, 1864 + +Major General Hitchcock, Commissioner of Exchanges, is authorized and directed to offer Brigadier General Trimble, now a prisoner of war in Fort McHenry, in exchange for Major White, who is held as a prisoner at Richmond. He is also directed to send forward the offer of exchange by Henry M. Warfield, Esq. of Baltimore, under a flag of truce, and give him a pass to City Point. + +Abraham Lincoln \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/lincoln_letter_2.md b/olmocr/bench/sample_data/olmocr/lincoln_letter_2.md new file mode 100644 index 0000000..73d6089 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/lincoln_letter_2.md @@ -0,0 +1,11 @@ +Executive Mansion, + +Washington City, + +January 15th, 1864 + +Major General Hitchcock, Commissioner of Exchanges, is authorized and directed to offer Brigadier General Trimble, now a prisoner of war in Fort McHenry, in exchange for Major White, who is held as a prisoner at Richmond. + +He is also directed to send forward the offer of exchange by Henry M. Warfield, Esq. of Baltimore, under a flag of truce, and give him a pass to City Point. + +Abraham Lincoln \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/lincoln_letter_3.md b/olmocr/bench/sample_data/olmocr/lincoln_letter_3.md new file mode 100644 index 0000000..70ec504 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/lincoln_letter_3.md @@ -0,0 +1,9 @@ +Executive Mansion, + +Washington City, + +January 15th, 1864 + +Major General Hitchcock, Commissioner of Exchanges, is authorized and directed to offer Brigadier General Trimble, now a prisoner of war in Fort McHenry, in exchange for Major White, who is held as a prisoner at Richmond. He is also directed to send forward the offer of exchange by Henry Wm. Marfield, Esq. of Baltimore, under a flag of truce, and give him a pass to City Point. + +Abraham Lincoln \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/lincoln_letter_4.md b/olmocr/bench/sample_data/olmocr/lincoln_letter_4.md new file mode 100644 index 0000000..7955d51 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/lincoln_letter_4.md @@ -0,0 +1,9 @@ +Executive Mansion, + +Washington City, + +January 15th, 1864 + +Major General Hitchcock, Commissioner of Exchange, is authorized and directed to offer Brigadier General Trimble, now a prisoner of war in Fort McHenry, in exchange for Major White, who is held as a prisoner at Richmond. He is also directed to send forward the offer of exchange by Henry M. Ward, Esq. of Baltimore, under a flag of truce, and give him a pass to City Point. + +Abraham Lincoln \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/lincoln_letter_5.md b/olmocr/bench/sample_data/olmocr/lincoln_letter_5.md new file mode 100644 index 0000000..73d6089 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/lincoln_letter_5.md @@ -0,0 +1,11 @@ +Executive Mansion, + +Washington City, + +January 15th, 1864 + +Major General Hitchcock, Commissioner of Exchanges, is authorized and directed to offer Brigadier General Trimble, now a prisoner of war in Fort McHenry, in exchange for Major White, who is held as a prisoner at Richmond. + +He is also directed to send forward the offer of exchange by Henry M. Warfield, Esq. of Baltimore, under a flag of truce, and give him a pass to City Point. + +Abraham Lincoln \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/mattsnotes_1.md b/olmocr/bench/sample_data/olmocr/mattsnotes_1.md new file mode 100644 index 0000000..aaa86e7 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/mattsnotes_1.md @@ -0,0 +1,30 @@ +V-February Flow + +Data Components: + +Code: +- The-Stack-V2 + +CodeText: +- SE, whatever we've scraped + +WebText: +- HQ DCLM + +DATA MIXES + +~85% Source Code +~10% CodeText +~5% WebText + +~85% The-Stack-V2 +~15% CodeText +~0% WebText + +~100% Source Code + +DeepSeek Coder + +StarCoder 2 + +Arctic \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/mattsnotes_2.md b/olmocr/bench/sample_data/olmocr/mattsnotes_2.md new file mode 100644 index 0000000..7c63417 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/mattsnotes_2.md @@ -0,0 +1,30 @@ +V-February Flow + +Data Components: + +Code: +- The-Stack-V2 + +CodeText: +- SE, whatever we’ve scraped + +WebText: +- HA DCLM + +DATA MIXES + +~85% Source Code +~15% CodeText +~0% Webtext + +~85% The-stack-V2 +~15% CodeText +~0% Webtext + +~100% Source Code + +Deepseek Coder + +StarCoder + +Arctic \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/mattsnotes_3.md b/olmocr/bench/sample_data/olmocr/mattsnotes_3.md new file mode 100644 index 0000000..cf15c47 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/mattsnotes_3.md @@ -0,0 +1,30 @@ +V-February Flow + +Data Components: + +Code: +- The-Stack-V2 + +CodeText: +- SE, whatever we've scraped + +WebText: +- HQ DCLM + +DATA MIXES + +\(~85\%\) Source Code +\(~10\%\) CodeText +\(~5\%\) Webtext + +\(~85\%\) The-stack-V2 +\(~15\%\) CodeText +\(~0\%\) Webtext + +\(~100\%\) Source Code + +DeepSeek Coder + +StarCoder 2 + +Arctic \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/mattsnotes_4.md b/olmocr/bench/sample_data/olmocr/mattsnotes_4.md new file mode 100644 index 0000000..f165aeb --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/mattsnotes_4.md @@ -0,0 +1,24 @@ +V-February Flow + +Data Components: + +Code: +The-Stack-V2 + +CodeText: +SE, whatever we've scraped + +WebText: +HQ DCLM + +DATA MIXES + +~ 85% Source Code} Deepseek Coder +~ 10% CodeText +~ 5% WebText + +~ 85% The-stack-V2} StarCoder 2 +~ 15% CodeText +~ 0% WebText + +~ 100% Source Code} Arctic \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/mattsnotes_5.md b/olmocr/bench/sample_data/olmocr/mattsnotes_5.md new file mode 100644 index 0000000..ec88e4f --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/mattsnotes_5.md @@ -0,0 +1,30 @@ +V-February Flow + +Data Components: + +Code: +The-Stack-V2 + +CodeText: +SE, whatever we've scraped + +WebText: +HQ DCLM + +DATA MIXES + +~85% Source Code +~10% CodeText +~5% Webtext + +~85% The-stack-V2 +~15% CodeText +~0% Webtext + +~100% Source Code + +Deepseek Coder + +UserCoder 2 + +Arctic \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/multi_column_miss.md b/olmocr/bench/sample_data/olmocr/multi_column_miss.md deleted file mode 100644 index 3797e59..0000000 --- a/olmocr/bench/sample_data/olmocr/multi_column_miss.md +++ /dev/null @@ -1,9 +0,0 @@ -stakeholders has occurred in other nations, with groups and individuals refusing to risk being appropriated into the industry’s public relations ambitions. It now looks like that with vigilance, tobacco control advocates can easily foment antithetical to social responsibility. Behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. - -Corporate social responsibility (CSR) emerged from a realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company’s deliberations on the matter, and the company’s perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. - -OVER THE PAST THREE DECADES INCREASING PRESSURE FROM NON-GOVERNMENTAL ORGANISATIONS (NGOs), GOVERNMENTS AND THE UNITED NATIONS, HAS REQUIRED TRANSNATIONAL CORPORATIONS (TNCs) TO EXAMINE AND REDRESS THE ADVERSE IMPACT THEIR BUSINESSES HAVE ON SOCIETY AND THE ENVIRONMENT. MANY HAVE RESPONDED BY TAKING UP WHAT IS KNOWN AS “CORPORATE SOCIAL RESPONSIBILITY” (CSR); ONLY RECENTLY HAVE TWO MAJOR CIGARETTE COMPANIES FOLLOWED SUIT: PHILIP MORRIS (PM) AND BRITISH AMERICAN TOBACCO (BAT). THIS REPORT FIRST PROVIDES THE CONTEXT AND DEVELOPMENT OF CSR; THEN, FROM INTERNAL COMPANY DOCUMENTS, EXAMINES HOW PM CAME TO ITS OWN VERSION. THIS PAPER EXAMINES WHETHER A TOBACCO COMPANY ESPousing CSR SHOULD BE JUDGED SIMPLY AS A CORPORATE ENTITY ALONG STANDARDS OF BUSINESS ETHICS, OR AS AN INERIevably negative force in the realm of public health, thereby rendering CSR an oxymoron. - -CORPORATE SOCIAL RESPONSIBILITY: THE CONTEXT - -The term “corporate social responsibility” is in vogue at the moment but as a concept it is vague and means different things to different people. Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of “noblese oblige”. But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century. The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of power. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/multi_column_miss_1.md b/olmocr/bench/sample_data/olmocr/multi_column_miss_1.md new file mode 100644 index 0000000..9b24d67 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/multi_column_miss_1.md @@ -0,0 +1,26 @@ +stakeholders has occurred in other nations, with groups and individuals refusing to risk being appropriated into the industry’s public relations ambitions. It now looks like that with vigilance, tobacco control advocates can easily foment similar distaste in many areas of the business community. Our actions sought to denormalise the tobacco industry by disrupting its efforts to take its place alongside other industries—often with considerable social credit—in the hope that it might gain by association. + +The tobacco industry posturing about its corporate responsibility can never hide the ugly consequences of its ongoing efforts to “work with all relevant stakeholders for the preservation of opportunities for informed adults to consume tobacco products” (translation: “we will build alliances with others who want to profit from tobacco use, to do all we can to counteract effective tobacco control”). BAT has 15.4% and Philip Morris 16.4% of the global cigarette market. With 4.9 million smokers currently dying from tobacco use each year, and the industry unblinkingly concurring that its products are addictive, this leaves BAT to argue why it should not be held to be largely accountable for the annual deaths of some 754 600 smokers, and Philip Morris some 803 600 smokers. + +REFERENCES +1 British American Tobacco. Social Report. http://www.bat.com/204pp +2 Wroe D. Tobacco ad campaign angers MPs. The Age (Melbourne) 2004; May 17 http://www.thegage.com.au/articles/2004/05/16/10844646691771.html?oneclick=true +3 Hirschhorn N. Corporate social responsibility and the tobacco industry: hope or hype? Tobacco Control 2004;13:447–53. +4 Ethical Corporation Asia 2004. Conference website. http://www.ethicalcorp.com/asia2004/ +5 Chapman S, Shatenstein S. Extreme corporate makeover: tobacco companies, corporate responsibility and the corruption of “ethics”. Globalink petition. http://petition.globalink.org/view.php?code=extreme. +6 Mackay J, Erikson M. The tobacco atlas: Geneva: World Health Organization, 2002. + +INDUSTRY WATCH +Corporate social responsibility and the tobacco industry: hope or hype? +N Hirschhorn + +Corporate social responsibility (CSR) emerged from a realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company’s deliberations on the matter, and the company’s perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +Over the past three decades increasing pressure from non-governmental organisations (NGOs), governments, and the United Nations, has required transnational corporations (TNCs) to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as “corporate social responsibility” (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to its own version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity along standards of business ethics, or as an irrevocably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +CORPORATE SOCIAL RESPONSIBILITY: THE CONTEXT +The term “corporate social responsibility” is in vogue at the moment but as a concept it is vague and means different things to different people. + +Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of “noblese oblige”. But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century. The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of + +Abbreviations: ASH, Action on Smoking and Health; BAT, British American Tobacco; CERES, Coalition for Environmentally Responsible Economies; CSR, corporate social responsibility; DJSI, Dow Jones Sustainability Index; GCAC, Global Corporate Affairs Council; GRI, Global Reporting Initiative; MSA, Master Settlement Agreement; NGOs, non-governmental organisations; PM, Philip Morris; TNCs, transnational corporations; UNEP, United Nations Environment Program \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/multi_column_miss_2.md b/olmocr/bench/sample_data/olmocr/multi_column_miss_2.md new file mode 100644 index 0000000..996ae30 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/multi_column_miss_2.md @@ -0,0 +1,34 @@ +stakeholders has occurred in other nations, with groups and individuals refusing to risk being appropriated into the industry’s public relations ambitions. It now looks like that with vigilance, tobacco control advocates can easily foment disruption of its ongoing efforts to “work with all relevant stakeholders for the preservation of opportunities for informed adults to consume tobacco products” (translation: “we will build alliances with others who want to profit from tobacco use, to do all we can to counteract effective tobacco control”). BAT has 15.4% and Philip Morris 16.4% of the global cigarette market. With 4.9 million smokers currently dying from tobacco use each year, and the industry unblinkingly concurring that its products are addictive, this leaves BAT to argue why it should not be held to be largely accountable for the annual deaths of some 754 600 smokers, and Philip Morris some 803 600 smokers. + +REFERENCES +1 British American Tobacco. Social Report. http://www.bat.com/204pp +2 Wroe D. Tobacco ad campaign angers MPs. The Age (Melbourne) 2004, May 17 http://www.theage.com.au/articles/2004/05/17/1084646669771.html?tonedclick=true +3 Hirschhorn N. Corporate social responsibility and the tobacco industry: hope or hype? Tobacco Control 2004;13:447–53. +4 Ethical Corporation Asia 2004. Conference website. http://www.ethicalcorp.com/asia2004/ +5 Chapman S, Shatenstein S. Extreme corporate makeover: tobacco companies, corporate responsibility and the corruption of “ethics”. Globalink petition. http://petition.globalink.org/view.php?codex=extreme +6 Mackay J, Eriksen M. The tobacco atlas. Geneva: World Health Organization, 2002. + +INDUSTRY WATCH + +Corporate social responsibility and the tobacco industry: hope or hype? + +N Hirschhorn + +Corporate social responsibility (CSR) emerged from a realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company’s deliberations on the matter, and the company’s perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +Over the past three decades increasing pressure from non-governmental organisations (NGOs), governments and the United Nations, has required transnational corporations (TNCs) to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as “corporate social responsibility” (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to its own version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity along standards of business ethics, or as an irrefutably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +CORPORATE SOCIAL RESPONSIBILITY: THE CONTEXT + +The term “corporate social responsibility” is in vogue at the moment but as a concept it is vague and means different things to different people. Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of “noblesse oblige”. But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century. The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of + +Abbreviations: ASH, Action on Smoking and Health; BAT, British American Tobacco; CERES, Coalition for Environmentally Responsible Economies; CSR, corporate social responsibility; DJSI, Dow Jones Sustainability Index; GCAC, Global Corporate Affairs Council; GRI, Global Reporting Initiative; MSA, Master Settlement Agreement; NGOs, non-governmental organisations; PM, Philip Morris; TNCs, transnational corporations; UNEP, United Nations Environment Program + +Correspondence to: Dr Norbert Hirschhorn, Nastolantie 6, A 00600 Helsinki, Finland; bertzoepf@yahoo.com + +Received 13 November 2003 +Accepted 15 July 2004 + +Tobacco Control 2004;13:447–453. doi: 10.1136/tc.2003.006676 + +www.tobaccocontrol.com \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/multi_column_miss_3.md b/olmocr/bench/sample_data/olmocr/multi_column_miss_3.md new file mode 100644 index 0000000..e7d932b --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/multi_column_miss_3.md @@ -0,0 +1,38 @@ +advocacy in action 447 + +tobacco products''1 (translation: ''we will build alliances with preservation of opportunities for informed adults to consume efforts to ''work with all relevant stakeholders for the ongoing industriesthe tobacco industry by disrupting its efforts to take its place alongside other industries—often with considerable social credit—in the hope that it might gain by association. + +Tobacco industry posturing about its corporate responsibility can never hide the ugly consequences of its ongoing efforts to ''work with all relevant stakeholders for the preservation of opportunities for informed adults to consume tobacco products''1 (translation: ''we will build alliances with others who want to profit from tobacco use, to do all we can to counteract effective tobacco control''). BAT has 15.4% and Philip Morris 16.4% of the global cigarette market.6 With 4.9 million smokers currently dying from tobacco use each year, and the industry unblinkingly concurring that its products are addictive, this leaves BAT to argue why it should not be held to be largely accountable for the annual deaths of some 754 600 smokers, and Philip Morris some 803 600 smokers. + +references +1 British American Tobacco. Social Report. http://www.bat.com/204pp +2 Wroe D. Tobacco ad campaign angers MPs. The Age (Melbourne) 2004; May 17 http://www.theage.com.au/articles/2004/05/16/108464669771.html +3 Hirschhorn N. Corporate social responsibility and the tobacco industry: hope or hype? Tobacco Control 2004;13:447–53. +4 Ethical Corporation Asia 2004. Conference website. http://www.ethicalcorp.com/asia2004/ +5 Chapman S, Shatenstein S. Extreme corporate makeover: tobacco companies, corporate responsibility and the corruption of ''ethics''. Globalink petition. http://petition.globalink.org/view.php?code=extreme. +6 Mackay J, Eriksen M. The tobacco atlas. Geneva: World Health Organization, 2002. + +industry watch + +Corporate social responsibility and the tobacco industry: hope or hype? + +N Hirschhorn + +Corporate social responsibility (CSR) emerged from a realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company’s deliberations on the matter, and the company’s perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +over the past three decades increasing pressure from non-governmental organisations (NGOs), governments, and the United Nations, has required transnational corporations (TNCs) to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as ‘‘corporate social responsibility’’ (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to its own version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity according to standards of business ethics, or as an irretrievably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +corporate social responsibility: the context + +The term ‘‘corporate social responsibility’’ is in vogue at the moment but as a concept it is vague and means different things to different people.1 + +Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of ‘‘noblesse oblige’’. But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century.2 The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of + +abbreviations: ASH, Action on Smoking and Health; BAT, British American Tobacco; CERES, Coalition for Environmentally Responsible Economies; CSR, corporate social responsibility; DJSI, Dow Jones Sustainability Index; GCAC, Global Corporate Affairs Council; GRI, Global Reporting Initiative; MSA, Master Settlement Agreement; NGOs, non-governmental organisations; PM, Philip Morris; TNCs, transnational corporations; UNEP, United Nations Environment Program + +Correspondence to: Dr Norbert Hirschhorn, Nastolantie 6, A3 00600 Helsinki, Finland; bertzpoef@yahoo.com + +Received 13 November 2003 +Accepted 15 July 2004 + +www.tobaccocontrol.com \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/multi_column_miss_4.md b/olmocr/bench/sample_data/olmocr/multi_column_miss_4.md new file mode 100644 index 0000000..71ebe86 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/multi_column_miss_4.md @@ -0,0 +1,26 @@ +stakeholders has occurred in other nations, with groups and individuals refusing to risk being appropriated into the industry’s public relations ambitions. It now looks like that with vigilance, tobacco control advocates can easily foment similar distaste in many areas of the business community. Our actions sought to denormalise the tobacco industry by disrupting its efforts to take its place alongside other industries—often with considerable social credit—in the hope that it might gain by association. + +Tobacco industry posturing about its corporate responsibility can never hide the ugly consequences of its ongoing efforts to “work with all relevant stakeholders for the preservation of opportunities for informed adults to consume tobacco products” (translation: “we will build alliances with others who want to profit from tobacco use, to do all we can to counteract effective tobacco control”). BAT has 15.4% and Philip Morris 16.4% of the global cigarette market. With 4.9 million smokers currently dying from tobacco use each year, and the industry unblinkingly concurring that its products are addictive, this leaves BAT to argue why it should not be held to be largely accountable for the annual deaths of some 754,600 smokers, and Philip Morris some 803,600 smokers. + +**REFERENCES** + +1. British American Tobacco. Social Report. http://www.bat.com/204pp +2. Wroe D. Tobacco ad campaign angers MPs. The Age (Melbourne) 2004; May 17 http://www.theage.com.au/articles/2004/05/16/108464669771.html?toneclick=true +3. Hirschhorn N. Corporate social responsibility and the tobacco industry: hope or hype? Tobacco Control 2004;13:447–53. +4. Ethical Corporation Asia 2004. Conference website. http://www.ethicalcorp.com/asia2004/ +5. Chapman S, Shatenstein S. Extreme corporate makeover: tobacco companies, corporate responsibility and the corruption of “ethics”. Globalink petition. http://petition.globalink.org/view.php?code=extreme. +6. Mackay J, Erikson M. The tobacco atlas. Geneva: World Health Organization, 2002. + +**INDUSTRY WATCH** + +Corporate social responsibility and the tobacco industry: hope or hype? + +N Hirschhorn + +Corporate social responsibility (CSR) emerged from a realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company’s deliberations on the matter, and the company’s perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +Over the past three decades increasing pressure from non-governmental organisations (NGOs), governments and the United Nations, has required transnational corporations (TNCs) to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as “corporate social responsibility” (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to its own version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity along standards of business ethics, or as an irretrievably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +**CORPORATE SOCIAL RESPONSIBILITY: THE CONTEXT** + +The term “corporate social responsibility” is in vogue at the moment but as a concept it is vague and means different things to different people. Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of “noblese oblige”. But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century. The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of... \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/multi_column_miss_5.md b/olmocr/bench/sample_data/olmocr/multi_column_miss_5.md new file mode 100644 index 0000000..b8ababf --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/multi_column_miss_5.md @@ -0,0 +1,17 @@ +Corporate social responsibility (CSR) emerged from a realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company’s deliberations on the matter, and the company’s perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +Corporations have been under increased pressure from non-governmental organisations (NGOs), governments, and the United Nations, to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as “corporate social responsibility” (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to its own version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity along standards of business ethics, or as an irrefutably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +**INDUSTRY WATCH** + +Corporate social responsibility and the tobacco industry: hope or hype? + +N Hirschhorn + +Corporate social responsibility (CSR) emerged from a realisation among transnational corporations of the need to account for and redress their adverse impact on society: specifically, on human rights, labour practices, and the environment. Two transnational tobacco companies have recently adopted CSR: Philip Morris, and British American Tobacco. This report explains the origins and theory behind CSR; examines internal company documents from Philip Morris showing the company’s deliberations on the matter, and the company’s perspective on its own behaviour; and reflects on whether marketing tobacco is antithetical to social responsibility. + +Over the past three decades increasing pressure from non-governmental organisations (NGOs), governments, and the United Nations, has required transnational corporations (TNCs) to examine and redress the adverse impact their businesses have on society and the environment. Many have responded by taking up what is known as “corporate social responsibility” (CSR); only recently have two major cigarette companies followed suit: Philip Morris (PM) and British American Tobacco (BAT). This report first provides the context and development of CSR; then, from internal company documents, examines how PM came to its own version. This paper examines whether a tobacco company espousing CSR should be judged simply as a corporate entity along standards of business ethics, or as an irrefutably negative force in the realm of public health, thereby rendering CSR an oxymoron. + +**CORPORATE SOCIAL RESPONSIBILITY: THE CONTEXT** + +The term “corporate social responsibility” is in vogue at the moment but as a concept it is vague and means different things to different people. Some writers on CSR trace its American roots to the 19th century when large industries engaged in philanthropy and established great public institutions, a form of “noblesse oblige”. But the notion that corporations should be required to return more to society because of their impact on society was driven by pressures from the civil rights, peace, and environmental movements of the last half century. The unprecedented expansion of power and influence of TNCs over the past three decades has accelerated global trade and development, but also environmental damage and abuses of... \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/olmo2-pg4_1.md b/olmocr/bench/sample_data/olmocr/olmo2-pg4_1.md new file mode 100644 index 0000000..837b53e --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/olmo2-pg4_1.md @@ -0,0 +1,28 @@ +| Source | Type | Tokens | Words | Bytes | Docs | +|-------------------------------|--------------------|---------|--------|---------|-------| +| DCLM-Baseline | Web pages | 3.71T | 3.32T | 21.32T | 2.95B | +| StarCoder | Code | 83.0B | 70.0B | 459B | 78.7M | +| filtered version | | | | | | +| from OLMoE Mix | | | | | | +| peS2o | Academic papers | 58.6B | 51.1B | 413B | 38.8M | +| from Dolma 1.7 | | | | | | +| arXiv | STEM papers | 20.8B | 19.3B | 77.2B | 3.95M | +| OpenWebMath | Math web pages | 12.2B | 11.1B | 47.2B | 2.89M | +| Algebraic Stack | Math proofs code | 11.8B | 10.8B | 44.0B | 2.83M | +| Wikipedia & Wikibooks | Encyclopedic | 3.7B | 3.16B | 16.2B | 6.17M | +| from Dolma 1.7 | | | | | | +| Total | | 3.90T | 3.48T | 22.38T | 3.08B | + +Table 1: Composition of the pretraining data for OLMo 2 Mix 1124. The OLMo 2 1124 Mix is composed of StarCoder (Li et al., 2023b; Kocetkov et al., 2022), peS2o (Soldaini and Lo, 2023), web text from DCLM (Li et al., 2024) and Wiki come from Dolma 1.7 (Soldaini et al., 2024). arXiv comes from Red-Pajama (Together AI, 2023), while OpenWebMath (Paster et al., 2023) and Algebraic Stack come from ProofPile II (Azerbayev et al., 2023). + +2.1.1 Pretraining data: OLMo 2 Mix 1124 + +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over 95% derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data used in OLMoE (Muennighoff et al., 2024). + +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use the “baseline 1.0” mix. From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., 2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). + +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection of this source, we found it to contain documents encoded in binary format or containing mostly numerical content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the document, or whose top-2 most frequent words constitute over 50% of the document. To mitigate possible training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details and show effectiveness of this intervention in Section §3.1. + +2.1.2 Mid-training data: Dolmino Mix 1124 + +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide focused exposure to STEM references and high quality text. We generate several variants of this mixture, with varying sizes, but generally refer to this mixture as Dolmino Mix 1124. The base sources from which Dolmino Mix 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep dive detailing our processes for experimenting and curating data for this mix. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/olmo2-pg4_2.md b/olmocr/bench/sample_data/olmocr/olmo2-pg4_2.md new file mode 100644 index 0000000..eb5c20c --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/olmo2-pg4_2.md @@ -0,0 +1,13 @@ +Table 1 Composition of the pretraining data for OLMo2. The OLMo 2 1124 Mix is composed of StarCoder (Li et al., 2023b; Kocetkov et al., 2022), peS2o (Soldaini and Lo, 2023), web text from DCLM (Li et al., 2024) and Wiki come from Dolma 1.7 (Soldaini et al., 2024). arXiv comes from Red-Pajama (Together AI, 2023), while OpenWebMath (Paster et al., 2023) and Algebraic Stack come from ProofPile II (Azerbayev et al., 2023). + +2.1.1 Pretraining data: OLMo 2 Mix 1124 + +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over 95% derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data used in OLMoE (Muennighoff et al., 2024). + +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use the “baseline 1.0” mix. From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., 2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). + +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection of this source, we found it to contain documents encoded in binary format or containing mostly numerical content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the document, or whose top-2 most frequent words constitute over 50% of the document. To mitigate possible training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details and show effectiveness of this intervention in Section §3.1. + +2.1.2 Mid-training data: Dolmino Mix 1124 + +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide focused exposure to STEM references and high quality text. We generate several variants of this mixture, with varying sizes, but generally refer to this mixture as DOLMino MIX 1124. The base sources from which DOLMino MIX 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep dive detailing our processes for experimenting and curating data for this mix. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/olmo2-pg4_3.md b/olmocr/bench/sample_data/olmocr/olmo2-pg4_3.md new file mode 100644 index 0000000..7fe1e0c --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/olmo2-pg4_3.md @@ -0,0 +1,13 @@ +Table 1 Composition of the pretraining data for OLMo 2. The OLMo 2 1124 Mix is composed of StarCoder (Li et al., 2023b; Kocetkov et al., 2022), peS2o (Soldaini and Lo, 2023), web text from DCLM (Li et al., 2024) and Wiki come from Dolma 1.7 (Soldaini et al., 2024). arXiv comes from Red-Pajama (Together AI, 2023), while OpenWebMath (Paster et al., 2023) and Algebraic Stack come from ProofPile II (Azerbayev et al., 2023). + +2.1.1 Pretraining data: OLMo 2 Mix 1124 + +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over 95% derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data used in OLMoE (Muennighoff et al., 2024). + +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use the “baseline 1.0” mix. From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., 2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). + +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection of this source, we found it to contain documents encoded in binary format or containing mostly numerical content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the document, or whose top-2 most frequent words constitute over 50% of the document. To mitigate possible training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details and show effectiveness of this intervention in Section §3.1. + +2.1.2 Mid-training data: Dolmino Mix 1124 + +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide focused exposure to STEM references and high quality text. We generate several variants of this mixture, with varying sizes, but generally refer to this mixture as Dolmino Mix 1124. The base sources from which Dolmino Mix 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep dive detailing our processes for experimenting and curating data for this mix. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/olmo2-pg4_4.md b/olmocr/bench/sample_data/olmocr/olmo2-pg4_4.md new file mode 100644 index 0000000..a1c9b21 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/olmo2-pg4_4.md @@ -0,0 +1,25 @@ +Table 1 Composition of the pretraining data for OLMo 2. The OLMo 2 1124 Mix is composed of StarCoder (Li et al., 2023b; Kocetkov et al., 2022), peS2o (Soldaini and Lo, 2023), web text from DCLM (Li et al., 2024) and Wiki come from Dolma 1.7 (Soldaini et al., 2024). arXiv comes from Red-Pajama (Together AI, 2023), while OpenWebMath (Paster et al., 2023) and Algebraic Stack come from ProofPile II (Azerbayev et al., 2023). + +| Source | Type | Tokens | Words | Bytes | Docs | +|-------------------------|--------------------------|----------|---------|---------|--------| +| DCLM-Baseline | Web pages | 3.71T | 3.32T | 21.32T | 2.95B | +| StarCoder | Code | 83.0B | 70.0B | 459B | 78.7M | +| StarCoder filtered version from OLMoE Mix | Academic papers | 58.6B | 51.1B | 413B | 38.8M | +| peS2o from Dolma 1.7 | Academic papers | 58.6B | 51.1B | 413B | 38.8M | +| arXiv | STEM papers | 20.8B | 19.3B | 77.2B | 3.95M | +| OpenWebMath | Math web pages | 12.2B | 11.1B | 47.2B | 2.89M | +| Algebraic Stack | Math proofs code | 11.8B | 10.8B | 44.0B | 2.83M | +| Wikipedia & Wikibooks | Encyclopedic | 3.7B | 3.16B | 16.2B | 6.17M | +| Total | | 3.90T | 3.48T | 22.38T | 3.08B | + +2.1.1 Pretraining data: OLMo 2 Mix 1124 + +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over 95% derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data used in OLMoE (Muennighoff et al., 2024). + +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use the “baseline 1.0” mix. From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., 2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). + +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection of this source, we found it to contain documents encoded in binary format or containing mostly numerical content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the document, or whose top-2 most frequent words constitute over 50% of the document. To mitigate possible training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details and show effectiveness of this intervention in Section §3.1. + +2.1.2 Mid-training data: Dolmino Mix 1124 + +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide focused exposure to STEM references and high quality text. We generate several variants of this mixture, with varying sizes, but generally refer to this mixture as Dolmino Mix 1124. The base sources from which Dolmino Mix 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep dive detailing our processes for experimenting and curating data for this mix. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/olmo2-pg4_5.md b/olmocr/bench/sample_data/olmocr/olmo2-pg4_5.md new file mode 100644 index 0000000..d03c74c --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/olmo2-pg4_5.md @@ -0,0 +1,27 @@ +Table 1: Composition of the pretraining data for OLMo 2 + +| Source | Type | Tokens | Words | Bytes | Docs | +|------------------------------|-----------------------|-----------|----------|----------|---------| +| Pretraining + OLMo 2 1124 Mix| | | | | | +| DCLM-Baseline | Web pages | 3.71T | 3.32T | 21.32T | 2.95B | +| StarCoder | Code | 83.0B | 70.0B | 459B | 78.7M | +| peS2o from Dolma 1.7 | Academic papers | 58.6B | 51.1B | 413B | 38.8M | +| arXiv | STEM papers | 20.8B | 19.3B | 77.2B | 3.95M | +| OpenWebMath | Math web pages | 12.2B | 11.1B | 47.2B | 2.89M | +| Algebraic Stack | Math proofs code | 11.8B | 10.8B | 44.0B | 2.83M | +| Wikipedia & Wikibooks from Dolma 1.7 | Encyclopedic | 3.7B | 3.16B | 16.2B | 6.17M | +| Total | | 3.90T | 3.48T | 22.38T | 3.08B | + +Table 1 Composition of the pretraining data for OLMo 2. The OLMo 2 1124 Mix is composed of StarCoder (Li et al., 2023b; Kocetkov et al., 2022), peS2o (Soldaini and Lo, 2023), web text from DCLM (Li et al., 2024) and Wiki from Dolma 1.7 (Soldaini et al., 2024). arXiv comes from Red-Pajama (Together AI, 2023), while OpenWebMath (Paster et al., 2023) and Algebraic Stack come from ProofPile II (Azerbayev et al., 2023). + +2.1.1 Pretraining data: OLMo 2 Mix 1124 + +The mix used for this stage is shown in Table 1. It consists of approximately 3.9 trillion tokens, with over 95% derived from web data. We refer to this set as OLMo 2 Mix 1124. This is the same pretraining data used in OLMoE (Muennighoff et al., 2024). + +We combine data from DCLM (Li et al., 2024) and Dolma 1.7 (Soldaini et al., 2024). From DCLM, we use the “baseline 1.0” mix. From Dolma, we use the arXiv (Together AI, 2023), OpenWebMath (Paster et al., 2023), Algebraic Stack, peS2o (Soldaini and Lo, 2023), and Wikipedia subsets. arXiv, OpenWebMath, and Algebraic Stack were originally part of ProofPile II (Azerbayev et al., 2023). + +Finally, we include code from StarCoder (Li et al., 2023b), which is derived from permissively-licensed repositories from GitHub (Kocetkov et al., 2022). In an attempt to include higher quality code, we remove any document from a repository with fewer than 2 stars on GitHub. Further, through manual inspection of this source, we found it to contain documents encoded in binary format or containing mostly numerical content; to remove them, we discarded documents whose most frequent word constitutes over 30% of the document, or whose top-2 most frequent words constitute over 50% of the document. To mitigate possible training loss spikes, we remove documents with repeated sequences of 32 or more n-grams. We report details and show effectiveness of this intervention in Section §3.1. + +2.1.2 Mid-training data: Dolmino Mix 1124 + +After the initial pretraining stage on mostly web data, we further train with a mixture of web data that has been more restrictively filtered for quality and a collection of domain-specific high quality data, much of which is synthetic. The purpose of this mixture is to imbue the model with math-centric skills and provide focused exposure to STEM references and high quality text. We generate several variants of this mixture, with varying sizes, but generally refer to this mixture as Dolmino Mix 1124. The base sources from which Dolmino Mix 1124 is subsampled are described in Table 2. We refer the reader to Section §4 for a deep dive detailing our processes for experimenting and curating data for this mix. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_1.md b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_1.md new file mode 100644 index 0000000..14f01c1 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_1.md @@ -0,0 +1,39 @@ +3.4 EXERCISES + +For the following exercises, the given functions represent the position of a particle traveling along a horizontal line. + +a. Find the velocity and acceleration functions. +b. Determine the time intervals when the object is slowing down or speeding up. + +150. \( s(t) = 2t^3 - 3t^2 - 12t + 8 \) +151. \( s(t) = 2t^3 - 15t^2 + 36t - 10 \) +152. \( s(t) = \frac{t}{1 + t^2} \) + +153. A rocket is fired vertically upward from the ground. The distance \( s \) in feet that the rocket travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 560t \). + +a. Find the velocity of the rocket 3 seconds after being fired. +b. Find the acceleration of the rocket 3 seconds after being fired. + +154. A ball is thrown downward with a speed of 8 ft/s from the top of a 64-foot-tall building. After \( t \) seconds, its height above the ground is given by \( s(t) = -16t^2 - 8t + 64 \). + +a. Determine how long it takes for the ball to hit the ground. +b. Determine the velocity of the ball when it hits the ground. + +155. The position function \( s(t) = t^2 - 3t - 4 \) represents the position of the back of a car backing out of a driveway and then driving in a straight line, where \( s \) is in feet and \( t \) is in seconds. In this case, \( s(t) = 0 \) represents the time at which the back of the car is at the garage door, so \( s(0) = -4 \) is the starting position of the car, 4 feet inside the garage. + +a. Determine the velocity of the car when \( s(t) = 0 \). +b. Determine the velocity of the car when \( s(t) = 14 \). + +156. The position of a hummingbird flying along a straight line in \( t \) seconds is given by \( s(t) = 3t^3 - 7t \) meters. + +a. Determine the velocity of the bird at \( t = 1 \) sec. +b. Determine the acceleration of the bird at \( t = 1 \) sec. +c. Determine the acceleration of the bird when the velocity equals 0. + +d. Determine the time intervals when the object is speeding up or slowing down. + +d. Determine the time intervals when the object is slowing down or speeding up. + +d. Determine the time intervals when the object is slowing down or speeding up. + +d. Determine the time intervals when the object is slowing down or speeding up. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_2.md b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_2.md new file mode 100644 index 0000000..2ef6bd4 --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_2.md @@ -0,0 +1,73 @@ +3.4 EXERCISES + +For the following exercises, the given functions represent the position of a particle traveling along a horizontal line. + +a. Find the velocity and acceleration functions. + +b. Determine the time intervals when the object is slowing down or speeding up. + +150. \( s(t) = 2t^3 - 3t^2 - 12t + 8 \) + +151. \( s(t) = 2t^3 - 15t^2 + 36t - 10 \) + +152. \( s(t) = \frac{t}{1 + t^2} \) + +153. A rocket is fired vertically upward from the ground. The distance \( s \) in feet that the rocket travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 560t \). + +a. Find the velocity of the rocket 3 seconds after being fired. + +b. Find the acceleration of the rocket 3 seconds after being fired. + +154. A ball is thrown downward with a speed of 8 ft/s from the top of a 64-foot-tall building. After \( t \) seconds, its height above the ground is given by \( s(t) = -16t^2 - 8t + 64 \). + +a. Determine how long it takes for the ball to hit the ground. + +b. Determine the velocity of the ball when it hits the ground. + +155. The position function \( s(t) = t^2 - 3t - 4 \) represents the position of the back of a car backing out of a driveway and then driving in a straight line, where \( s \) is in feet and \( t \) is in seconds. In this case, \( s(t) = 0 \) represents the time at which the back of the car is at the garage door, so \( s(0) = -4 \) is the starting position of the car, 4 feet inside the garage. + +a. Determine the velocity of the car when \( s(t) = 0 \). + +b. Determine the velocity of the car when \( s(t) = 14 \). + +156. The position of a hummingbird flying along a straight line in \( t \) seconds is given by \( s(t) = 3t^3 - 7t \) meters. + +a. Determine the velocity of the bird at \( t = 1 \) sec. + +b. Determine the acceleration of the bird at \( t = 1 \) sec. + +c. Determine the acceleration of the bird when the velocity equals 0. + +157. A potato is launched vertically upward with an initial velocity of 100 ft/s from a potato gun at the top of an 85-foot-tall building. The distance in feet that the potato travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 100t + 85 \). + +a. Find the velocity of the potato after 0.5 s and 5.75 s. + +b. Find the speed of the potato at 0.5 s and 5.75 s. + +c. Determine when the potato reaches its maximum height. + +d. Find the acceleration of the potato at 0.5 s and 1.5 s. + +e. Determine how long the potato is in the air. + +f. Determine the velocity of the potato upon hitting the ground. + +158. The position function \( s(t) = t^3 - 8t \) gives the position in miles of a freight train where east is the positive direction and \( t \) is measured in hours. + +a. Determine the direction the train is traveling when \( s(t) = 0 \). + +b. Determine the direction the train is traveling when \( s(t) = 0 \). + +c. Determine the time intervals when the train is slowing down or speeding up. + +159. The following graph shows the position \( y = s(t) \) of an object moving along a straight line. + +![Graph of the position function](image) + +a. Use the graph of the position function to determine the time intervals when the velocity is positive, negative, or zero. + +b. Sketch the graph of the velocity function. + +c. Use the graph of the velocity function to determine the time intervals when the acceleration is positive, negative, or zero. + +d. Determine the time intervals when the object is speeding up or slowing down. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_3.md b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_3.md new file mode 100644 index 0000000..746e56d --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_3.md @@ -0,0 +1,73 @@ +3.4 EXERCISES + +For the following exercises, the given functions represent the position of a particle traveling along a horizontal line. + +a. Find the velocity and acceleration functions. + +b. Determine the time intervals when the object is slowing down or speeding up. + +150. \( s(t) = 2t^3 - 3t^2 - 12t + 8 \) + +151. \( s(t) = 2t^3 - 15t^2 + 36t - 10 \) + +152. \( s(t) = \frac{t}{1 + t^2} \) + +153. A rocket is fired vertically upward from the ground. The distance \( s \) in feet that the rocket travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 560t \). + +a. Find the velocity of the rocket 3 seconds after being fired. + +b. Find the acceleration of the rocket 3 seconds after being fired. + +154. A ball is thrown downward with a speed of 8 ft/s from the top of a 64-foot-tall building. After \( t \) seconds, its height above the ground is given by \( s(t) = -16t^2 - 8t + 64 \). + +a. Determine how long it takes for the ball to hit the ground. + +b. Determine the velocity of the ball when it hits the ground. + +155. The position function \( s(t) = t^2 - 3t - 4 \) represents the position of the back of a car backing out of a driveway and then driving in a straight line, where \( s \) is in feet and \( t \) is in seconds. In this case, \( s(t) = 0 \) represents the time at which the back of the car is at the garage door, so \( s(0) = -4 \) is the starting position of the car, 4 feet inside the garage. + +a. Determine the velocity of the car when \( s(t) = 0 \). + +b. Determine the velocity of the car when \( s(t) = 14 \). + +156. The position of a hummingbird flying along a straight line in \( t \) seconds is given by \( s(t) = 3t^3 - 7t \) meters. + +a. Determine the velocity of the bird at \( t = 1 \) sec. + +b. Determine the acceleration of the bird at \( t = 1 \) sec. + +c. Determine the acceleration of the bird when the velocity equals 0. + +157. A potato is launched vertically upward with an initial velocity of 100 ft/s from a potato gun at the top of an 85-foot-tall building. The distance in feet that the potato travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 100t + 85 \). + +a. Find the velocity of the potato after 0.5 s and 5.75 s. + +b. Find the speed of the potato at 0.5 s and 5.75 s. + +c. Determine when the potato reaches its maximum height. + +d. Find the acceleration of the potato at 0.5 s and 1.5 s. + +e. Determine how long the potato is in the air. + +f. Determine the velocity of the potato upon hitting the ground. + +158. The position function \( s(t) = t^3 - 8t \) gives the position in miles of a freight train where east is the positive direction and \( t \) is measured in hours. + +a. Determine the direction the train is traveling when \( s(t) = 0 \). + +b. Determine the direction the train is traveling when \( s(t) = 0 \). + +c. Determine the time intervals when the train is slowing down or speeding up. + +159. The following graph shows the position \( y = s(t) \) of an object moving along a straight line. + +[Graph image] + +a. Use the graph of the position function to determine the time intervals when the velocity is positive, negative, or zero. + +b. Sketch the graph of the velocity function. + +c. Use the graph of the velocity function to determine the time intervals when the acceleration is positive, negative, or zero. + +d. Determine the time intervals when the object is speeding up or slowing down. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_4.md b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_4.md new file mode 100644 index 0000000..0895d9f --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_4.md @@ -0,0 +1,73 @@ +3.4 EXERCISES + +For the following exercises, the given functions represent the position of a particle traveling along a horizontal line. + +a. Find the velocity and acceleration functions. + +b. Determine the time intervals when the object is slowing down or speeding up. + +150. \( s(t) = 2t^3 - 3t^2 - 12t + 8 \) + +151. \( s(t) = 2t^3 - 15t^2 + 36t - 10 \) + +152. \( s(t) = \frac{t}{1 + t^2} \) + +153. A rocket is fired vertically upward from the ground. The distance \( s \) in feet that the rocket travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 560t \). + +a. Find the velocity of the rocket 3 seconds after being fired. + +b. Find the acceleration of the rocket 3 seconds after being fired. + +154. A ball is thrown downward with a speed of 8 ft/s from the top of a 64-foot-tall building. After \( t \) seconds, its height above the ground is given by \( s(t) = -16t^2 - 8t + 64 \). + +a. Determine how long it takes for the ball to hit the ground. + +b. Determine the velocity of the ball when it hits the ground. + +155. The position function \( s(t) = t^2 - 3t - 4 \) represents the position of the back of a car backing out of a driveway and then driving in a straight line, where \( s \) is in feet and \( t \) is in seconds. In this case, \( s(t) = 0 \) represents the time at which the back of the car is at the garage door, so \( s(0) = -4 \) is the starting position of the car, 4 feet inside the garage. + +a. Determine the velocity of the car when \( s(t) = 0 \). + +b. Determine the velocity of the car when \( s(t) = 14 \). + +156. The position of a hummingbird flying along a straight line in \( t \) seconds is given by \( s(t) = 3t^3 - 7t \) meters. + +a. Determine the velocity of the bird at \( t = 1 \) sec. + +b. Determine the acceleration of the bird at \( t = 1 \) sec. + +c. Determine the acceleration of the bird when the velocity equals 0. + +157. A potato is launched vertically upward with an initial velocity of 100 ft/s from a potato gun at the top of an 85-foot-tall building. The distance in feet that the potato travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 100t + 85 \). + +a. Find the velocity of the potato after 0.5 s and 5.75 s. + +b. Find the speed of the potato at 0.5 s and 5.75 s. + +c. Determine when the potato reaches its maximum height. + +d. Find the acceleration of the potato at 0.5 s and 1.5 s. + +e. Determine how long the potato is in the air. + +f. Determine the velocity of the potato upon hitting the ground. + +158. The position function \( s(t) = t^3 - 8t \) gives the position in miles of a freight train where east is the positive direction and \( t \) is measured in hours. + +a. Determine the direction the train is traveling when \( s(t) = 0 \). + +b. Determine the direction the train is traveling when \( s(t) = 0 \). + +c. Determine the time intervals when the train is slowing down or speeding up. + +159. The following graph shows the position \( y = s(t) \) of an object moving along a straight line. + +[Graph of a position function] + +a. Use the graph of the position function to determine the time intervals when the velocity is positive, negative, or zero. + +b. Sketch the graph of the velocity function. + +c. Use the graph of the velocity function to determine the time intervals when the acceleration is positive, negative, or zero. + +d. Determine the time intervals when the object is speeding up or slowing down. \ No newline at end of file diff --git a/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_5.md b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_5.md new file mode 100644 index 0000000..681438d --- /dev/null +++ b/olmocr/bench/sample_data/olmocr/openstax_caculus_pg_273_5.md @@ -0,0 +1,71 @@ +3.4 EXERCISES + +For the following exercises, the given functions represent the position of a particle traveling along a horizontal line. + +a. Find the velocity and acceleration functions. + +b. Determine the time intervals when the object is slowing down or speeding up. + +150. \( s(t) = 2t^3 - 3t^2 - 12t + 8 \) + +151. \( s(t) = 2t^3 - 15t^2 + 36t - 10 \) + +152. \( s(t) = \frac{t}{1 + t^2} \) + +153. A rocket is fired vertically upward from the ground. The distance \( s \) in feet that the rocket travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 560t \). + +a. Find the velocity of the rocket 3 seconds after being fired. + +b. Find the acceleration of the rocket 3 seconds after being fired. + +154. A ball is thrown downward with a speed of 8 ft/s from the top of an 85-foot-tall building. After \( t \) seconds, its height above the ground is given by \( s(t) = -16t^2 - 8t + 64 \). + +a. Determine how long it takes for the ball to hit the ground. + +b. Determine the velocity of the ball when it hits the ground. + +155. The position function \( s(t) = t^2 - 3t - 4 \) represents the position of the back of a car backing out of a driveway and then driving in a straight line, where \( s \) is in feet and \( t \) is in seconds. In this case, \( s(t) = 0 \) represents the time at which the back of the car is at the garage door, so \( s(0) = -4 \) is the starting position of the car, 4 feet inside the garage. + +a. Determine the velocity of the car when \( s(t) = 0 \). + +b. Determine the velocity of the car when \( s(t) = 14 \). + +156. The position of a hummingbird flying along a straight line in \( t \) seconds is given by \( s(t) = 3t^3 - 7t \) meters. + +a. Determine the velocity of the bird at \( t = 1 \) sec. + +b. Determine the acceleration of the bird at \( t = 1 \) sec. + +c. Determine the acceleration of the bird when the velocity equals 0. + +157. A potato is launched vertically upward with an initial velocity of 100 ft/s from a potato gun at the top of an 85-foot-tall building. The distance in feet that the potato travels from the ground after \( t \) seconds is given by \( s(t) = -16t^2 + 100t + 85 \). + +a. Find the velocity of the potato after 0.5 s and 5.75 s. + +b. Find the speed of the potato at 0.5 s and 5.75 s. + +c. Determine when the potato reaches its maximum height. + +d. Find the acceleration of the potato at 0.5 s and 1.5 s. + +e. Determine how long the potato is in the air. + +f. Determine the velocity of the potato upon hitting the ground. + +158. The position function \( s(t) = t^3 - 8t \) gives the position in miles of a freight train where east is the positive direction and \( t \) is measured in hours. + +a. Determine the direction the train is traveling when \( s(t) = 0 \). + +b. Determine the direction the train is traveling when \( a(t) = 0 \). + +c. Determine the time intervals when the train is slowing down or speeding up. + +159. The following graph shows the position \( y = s(t) \) of an object moving along a straight line. + +a. Use the graph of the position function to determine the time intervals when the velocity is positive, negative, or zero. + +b. Sketch the graph of the velocity function. + +Use the graph of the velocity function to determine the time intervals when the acceleration is positive, negative, or zero. + +d. Determine the time intervals when the object is speeding up or slowing down. \ No newline at end of file