SOURCES.txt 3.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131
  1. LICENSE
  2. README.md
  3. pyproject.toml
  4. olmocr/__init__.py
  5. olmocr/check.py
  6. olmocr/datatypes.py
  7. olmocr/image_utils.py
  8. olmocr/loadertest.py
  9. olmocr/metrics.py
  10. olmocr/pipeline.py
  11. olmocr/py.typed
  12. olmocr/repeatdetect.py
  13. olmocr/s3_utils.py
  14. olmocr/version.py
  15. olmocr/work_queue.py
  16. olmocr.egg-info/PKG-INFO
  17. olmocr.egg-info/SOURCES.txt
  18. olmocr.egg-info/dependency_links.txt
  19. olmocr.egg-info/requires.txt
  20. olmocr.egg-info/top_level.txt
  21. olmocr/bench/__init__.py
  22. olmocr/bench/benchmark.py
  23. olmocr/bench/convert.py
  24. olmocr/bench/prompts.py
  25. olmocr/bench/report.py
  26. olmocr/bench/review_app.py
  27. olmocr/bench/review_app_latex.py
  28. olmocr/bench/tests.py
  29. olmocr/bench/utils.py
  30. olmocr/bench/katex/__init__.py
  31. olmocr/bench/katex/render.py
  32. olmocr/bench/miners/check_headers_footers.py
  33. olmocr/bench/miners/check_multicolumn.py
  34. olmocr/bench/miners/check_old_scans_math.py
  35. olmocr/bench/miners/cleanup_data.py
  36. olmocr/bench/miners/cleanup_urls.py
  37. olmocr/bench/miners/delete_rejected.py
  38. olmocr/bench/miners/download_math.py
  39. olmocr/bench/miners/mine_diffs.py
  40. olmocr/bench/miners/mine_headers_footers.py
  41. olmocr/bench/miners/mine_long_tiny_text.py
  42. olmocr/bench/miners/mine_math.py
  43. olmocr/bench/miners/mine_multi_column.py
  44. olmocr/bench/miners/mine_old_scan_pdf.py
  45. olmocr/bench/miners/mine_old_scans.py
  46. olmocr/bench/miners/mine_old_scans_math.py
  47. olmocr/bench/miners/mine_reading_order.py
  48. olmocr/bench/miners/mine_tables_gemini.py
  49. olmocr/bench/miners/mine_tables_gpt.py
  50. olmocr/bench/miners/pick_mediod.py
  51. olmocr/bench/runners/__init__.py
  52. olmocr/bench/runners/run_chatgpt.py
  53. olmocr/bench/runners/run_claude.py
  54. olmocr/bench/runners/run_docling.py
  55. olmocr/bench/runners/run_gemini.py
  56. olmocr/bench/runners/run_gotocr.py
  57. olmocr/bench/runners/run_marker.py
  58. olmocr/bench/runners/run_mineru.py
  59. olmocr/bench/runners/run_mistral.py
  60. olmocr/bench/runners/run_olmocr_pipeline.py
  61. olmocr/bench/runners/run_rolmocr.py
  62. olmocr/bench/runners/run_server.py
  63. olmocr/bench/runners/run_transformers.py
  64. olmocr/bench/scripts/difference_viewer.py
  65. olmocr/bench/scripts/run_difference.py
  66. olmocr/bench/scripts/url_matcher.py
  67. olmocr/bench/synth/__init__.py
  68. olmocr/bench/synth/mine_html_templates.py
  69. olmocr/bench/synth/test_mine.py
  70. olmocr/data/__init__.py
  71. olmocr/data/buildsilver.py
  72. olmocr/data/buildsilverdatasummary.py
  73. olmocr/data/buildtestset.py
  74. olmocr/data/convertsilver_birr.py
  75. olmocr/data/convertsilver_openai.py
  76. olmocr/data/renderpdf.py
  77. olmocr/data/runopenaibatch.py
  78. olmocr/eval/__init__.py
  79. olmocr/eval/buildelo.py
  80. olmocr/eval/evalhtml.py
  81. olmocr/eval/evalhtml_template.html
  82. olmocr/eval/runeval.py
  83. olmocr/eval/scoreelo.py
  84. olmocr/eval/dolma_refine/aligners.py
  85. olmocr/eval/dolma_refine/metrics.py
  86. olmocr/eval/dolma_refine/registry.py
  87. olmocr/eval/dolma_refine/segmenters.py
  88. olmocr/filter/__init__.py
  89. olmocr/filter/coherency.py
  90. olmocr/filter/filter.py
  91. olmocr/prompts/__init__.py
  92. olmocr/prompts/anchor.py
  93. olmocr/prompts/prompts.py
  94. olmocr/train/__init__.py
  95. olmocr/train/dataloader.py
  96. olmocr/train/dataprep.py
  97. olmocr/train/fixqwen25vlcheckpoint.py
  98. olmocr/train/inference.py
  99. olmocr/train/loaddataset.py
  100. olmocr/train/train.py
  101. olmocr/train/utils.py
  102. olmocr/train/core/__init__.py
  103. olmocr/train/core/adapters.py
  104. olmocr/train/core/cli.py
  105. olmocr/train/core/compression.py
  106. olmocr/train/core/config.py
  107. olmocr/train/core/errors.py
  108. olmocr/train/core/loggers.py
  109. olmocr/train/core/paths.py
  110. olmocr/train/core/state.py
  111. olmocr/train/hf/__init__.py
  112. olmocr/train/hf/convertjsontoparquet.py
  113. olmocr/train/hf/hfhub_upload.py
  114. olmocr/train/hf/warc_parser.py
  115. olmocr/train/molmo/__init__.py
  116. olmocr/train/molmo/config_molmo.py
  117. olmocr/train/molmo/image_processing_molmo.py
  118. olmocr/train/molmo/modeling_molmo.py
  119. olmocr/train/molmo/preprocessing_molmo.py
  120. olmocr/viewer/__init__.py
  121. olmocr/viewer/dolmaviewer.py
  122. olmocr/viewer/dolmaviewer_template.html
  123. tests/test_anchor.py
  124. tests/test_dataloader.py
  125. tests/test_dataprep.py
  126. tests/test_filter.py
  127. tests/test_integration.py
  128. tests/test_molmo.py
  129. tests/test_s3_work_queue.py
  130. tests/test_sglang.py
  131. tests/test_tests.py