hynky HF Staff committed on
Commit
362fc2c
·
0 Parent(s):

Initial commit

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +3 -0
  2. README.md +8 -0
  3. extraction/non_truncated/record_0.json +3 -0
  4. extraction/non_truncated/record_1.json +3 -0
  5. extraction/non_truncated/record_10.json +3 -0
  6. extraction/non_truncated/record_11.json +3 -0
  7. extraction/non_truncated/record_12.json +3 -0
  8. extraction/non_truncated/record_13.json +3 -0
  9. extraction/non_truncated/record_14.json +3 -0
  10. extraction/non_truncated/record_15.json +3 -0
  11. extraction/non_truncated/record_16.json +3 -0
  12. extraction/non_truncated/record_17.json +3 -0
  13. extraction/non_truncated/record_18.json +3 -0
  14. extraction/non_truncated/record_19.json +3 -0
  15. extraction/non_truncated/record_2.json +3 -0
  16. extraction/non_truncated/record_20.json +3 -0
  17. extraction/non_truncated/record_21.json +3 -0
  18. extraction/non_truncated/record_22.json +3 -0
  19. extraction/non_truncated/record_23.json +3 -0
  20. extraction/non_truncated/record_24.json +3 -0
  21. extraction/non_truncated/record_25.json +3 -0
  22. extraction/non_truncated/record_26.json +3 -0
  23. extraction/non_truncated/record_27.json +3 -0
  24. extraction/non_truncated/record_28.json +3 -0
  25. extraction/non_truncated/record_29.json +3 -0
  26. extraction/non_truncated/record_3.json +3 -0
  27. extraction/non_truncated/record_30.json +3 -0
  28. extraction/non_truncated/record_31.json +3 -0
  29. extraction/non_truncated/record_32.json +3 -0
  30. extraction/non_truncated/record_33.json +3 -0
  31. extraction/non_truncated/record_34.json +3 -0
  32. extraction/non_truncated/record_35.json +3 -0
  33. extraction/non_truncated/record_36.json +3 -0
  34. extraction/non_truncated/record_37.json +3 -0
  35. extraction/non_truncated/record_38.json +3 -0
  36. extraction/non_truncated/record_39.json +3 -0
  37. extraction/non_truncated/record_4.json +3 -0
  38. extraction/non_truncated/record_40.json +3 -0
  39. extraction/non_truncated/record_41.json +3 -0
  40. extraction/non_truncated/record_42.json +3 -0
  41. extraction/non_truncated/record_43.json +3 -0
  42. extraction/non_truncated/record_44.json +3 -0
  43. extraction/non_truncated/record_45.json +3 -0
  44. extraction/non_truncated/record_46.json +3 -0
  45. extraction/non_truncated/record_47.json +3 -0
  46. extraction/non_truncated/record_48.json +3 -0
  47. extraction/non_truncated/record_49.json +3 -0
  48. extraction/non_truncated/record_5.json +3 -0
  49. extraction/non_truncated/record_6.json +3 -0
  50. extraction/non_truncated/record_7.json +3 -0
.gitattributes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ *.json filter=lfs diff=lfs merge=lfs -text
2
+ *.jsonl filter=lfs diff=lfs merge=lfs -text
3
+ *.pdf filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ title: PDF Extraction Comparison
2
+ emoji: 📉
3
+ colorFrom: green
4
+ colorTo: gray
5
+ sdk: gradio
6
+ sdk_version: 5.27.0
7
+ app_file: extractor_compare.py
8
+ pinned: false
extraction/non_truncated/record_0.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:167521da014ee1816adfa9667e045dc5835ebbfde0d4c036a1c354e15f51dbca
3
+ size 63882
extraction/non_truncated/record_1.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f0a96a2e7dc9833c93b2817f91ea2cdb46844bd8f216b34ec88bbb3b404183e
3
+ size 2355885
extraction/non_truncated/record_10.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09b4a9ac963d2795aef7a86d20944049d2554a7cf75dd94a58c17115dc581299
3
+ size 1477192
extraction/non_truncated/record_11.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cf21c60728cba6f508dbf44c98cd4b968df2cce2bfcb05f0647762edf54f487
3
+ size 68649
extraction/non_truncated/record_12.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc2d0f828fdf221ee601cc6904e599665b4ae12082e2b9d2a76c2f7d32528921
3
+ size 58362
extraction/non_truncated/record_13.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2182ed09edf5a0aa885f1ac28dddf070d96342c8606fd27e4315e44b39ade036
3
+ size 263549
extraction/non_truncated/record_14.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3066f1b77f8d4190cf2928a09f883dc6b3f628cf257a9479d9bf822df465e389
3
+ size 610239
extraction/non_truncated/record_15.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eb949316ebfd20294ddd0c1e1ac73a748da4a3f1bfefc819f2c292b54e4ef55
3
+ size 225940
extraction/non_truncated/record_16.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3f7bec9722662ec468459191a19077ccbdda6f4c4bd7156f0d3ba46908afed5
3
+ size 207706
extraction/non_truncated/record_17.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c6eeee023c92b02ccc1dcb9d775e80eab03a82f78a062e266590427aa8cd5cd
3
+ size 151205
extraction/non_truncated/record_18.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ca829e8020f472452f7c41ec63f3ddfcdd6dce0b04167c383c311e290129124
3
+ size 730429
extraction/non_truncated/record_19.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a5e819288bc5b404228abe38e4e07c966a13597f8cb1ae0336c1d58cebd0573
3
+ size 4347952
extraction/non_truncated/record_2.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26cb541e4ed8038eb44dce3f74a40b2a748f09e3ce98168c95b1ae6959699e31
3
+ size 200511
extraction/non_truncated/record_20.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3695a6b19de6b483e6f9f4ce417584d3bca274d1a18bb88f1fc3bc3a4e5a372
3
+ size 34621
extraction/non_truncated/record_21.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60619c8ebe2caba7c9e2ea3304418a461bd351b90ec6a1a3a3af31fb92ef0196
3
+ size 1403253
extraction/non_truncated/record_22.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9939ba567c0e42fd17ecef79384c5125e56cb5bd53f2229b0115301d048ecc00
3
+ size 505232
extraction/non_truncated/record_23.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81be2481d68dd31f741082419de4dcfd8aa4575200d1fddad407f476a1dedd76
3
+ size 889179
extraction/non_truncated/record_24.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf0f8312ea71e37843d206374692ae41e92f42d442a4c5ec7599eb3ca59e0a88
3
+ size 951925
extraction/non_truncated/record_25.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86828204d28fb8bbc5031f49548d8a9949767c58ffae242bd401a8996461475b
3
+ size 30260
extraction/non_truncated/record_26.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a25e63f13b7efa1af614ed705b31a05ea32481e9e354964e1a207652b66a4e19
3
+ size 189677
extraction/non_truncated/record_27.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7709908a0df97a54b8b99f423d646bb280904efa26c97b83989021aacf32cb5
3
+ size 384357
extraction/non_truncated/record_28.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa2f0b2e981d2972a9c8a52234a5a736eb0f6c86cdb36c61e76b8580a4ec6583
3
+ size 38877
extraction/non_truncated/record_29.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ad40b768f55f12542d29a4abb4c832188401046a13611671199350b4c95d921
3
+ size 135635
extraction/non_truncated/record_3.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b1ff68c4d0a3f81aaa60d970767832f823c498286f8c149efeb25b9e6079648
3
+ size 655199
extraction/non_truncated/record_30.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5ac40be45da7450a9430f86b45eddb1f0913f0884ed84e67dff6a9d9eae0596
3
+ size 196521
extraction/non_truncated/record_31.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3120768e0f4f63acfb4ea6c504634c129d40179730e9a268170f4a4cdc1904d
3
+ size 885829
extraction/non_truncated/record_32.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f86e7ab93d134a1fa59bfe062ba6fc226a323f976012320ac61d9b3e56bde0b
3
+ size 372363
extraction/non_truncated/record_33.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ecf8838485b6667b1362f39f5a0d7886b4a05ed61f80fccdf2f71b9fe9b98c7
3
+ size 5082783
extraction/non_truncated/record_34.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:395237b321ad926362bd520315d527184261f73cf031533aa170d2a36ef80409
3
+ size 38339
extraction/non_truncated/record_35.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45172f2b9c3975dc0fa102323d65c98606edaf0dfcfaf1e94c5075bb6ba58eb9
3
+ size 363612
extraction/non_truncated/record_36.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1838aa1feed4c9f70dd600276f4d83249ab8f046acc9d67a9028abacde224af1
3
+ size 696226
extraction/non_truncated/record_37.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eebf8813eba242eaf54427058dadd927c037074645fb6872b068f692e35d8cc
3
+ size 188427
extraction/non_truncated/record_38.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c90ff6c48476635f96802b94a776605f887bcbc305b23e1b4c579c3f8ae567b9
3
+ size 858917
extraction/non_truncated/record_39.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0859d7ced21f7147b79de2e68798076063f3630379e1bd62097750191658d2ba
3
+ size 231498
extraction/non_truncated/record_4.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5dc03dd9e70cbdfbe2f1a2010686f18f984ca5c4d94e6f006de0d4225c43c57
3
+ size 336622
extraction/non_truncated/record_40.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6831ac023d481844a3368394b5853697f6d1ac5b7ee8042f606c2cc72de28492
3
+ size 189523
extraction/non_truncated/record_41.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b2c3b9c753feb18018980143409d4a670a2b36f85f271d66e3574297391bb69
3
+ size 1717290
extraction/non_truncated/record_42.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:103d572230006e3231311feaa9fb18541fbe7347330c195e7e49f8462c131936
3
+ size 504077
extraction/non_truncated/record_43.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c26bd2a27e3f7c1cae06a965f4b36333d9eac548238f155a9f22502c1edc9ed8
3
+ size 178433
extraction/non_truncated/record_44.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc3c4e63fe0d91dcc7927005b6bbce23aad1f6a76f438b12334952652bf5811f
3
+ size 578235
extraction/non_truncated/record_45.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4828368d4df51ee31aac1d332965e597d2ad7e7d69eb12c62547984d333b9c7
3
+ size 65628
extraction/non_truncated/record_46.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1a5c9af7071dc69a5a2ebc8ba8fa75e55dbcca845215d60cfd82662803f05b4
3
+ size 353066
extraction/non_truncated/record_47.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cb7f41c1b0950e0a87846f0b79077eadbff0d70dad758904db03df28b4db761
3
+ size 587671
extraction/non_truncated/record_48.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a57ef801045de8bb4bd18e4ba6e9385a97b64b1263e8e2f215b53ef2c3a3785
3
+ size 139104
extraction/non_truncated/record_49.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86703b12aaa2586771ad8140184dedfe719c490bfdeaf1098d7b447d03b5a1e3
3
+ size 424608
extraction/non_truncated/record_5.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e81014ac3d91bf012f645e1732f1292ab417a4bffe50f0a37d3ba5bb99cb0549
3
+ size 463779
extraction/non_truncated/record_6.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c581ce6b5af035a25ba1f0a0a3c3c25bb95bb3a8009c17a09430d9d51153a4e7
3
+ size 723599
extraction/non_truncated/record_7.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e71c27130c52ca65accba4ca8415144d3aafc3167bafcc0e0736978e192b1745
3
+ size 402046