Commit
·
362fc2c
0
Parent(s):
Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +3 -0
- README.md +8 -0
- extraction/non_truncated/record_0.json +3 -0
- extraction/non_truncated/record_1.json +3 -0
- extraction/non_truncated/record_10.json +3 -0
- extraction/non_truncated/record_11.json +3 -0
- extraction/non_truncated/record_12.json +3 -0
- extraction/non_truncated/record_13.json +3 -0
- extraction/non_truncated/record_14.json +3 -0
- extraction/non_truncated/record_15.json +3 -0
- extraction/non_truncated/record_16.json +3 -0
- extraction/non_truncated/record_17.json +3 -0
- extraction/non_truncated/record_18.json +3 -0
- extraction/non_truncated/record_19.json +3 -0
- extraction/non_truncated/record_2.json +3 -0
- extraction/non_truncated/record_20.json +3 -0
- extraction/non_truncated/record_21.json +3 -0
- extraction/non_truncated/record_22.json +3 -0
- extraction/non_truncated/record_23.json +3 -0
- extraction/non_truncated/record_24.json +3 -0
- extraction/non_truncated/record_25.json +3 -0
- extraction/non_truncated/record_26.json +3 -0
- extraction/non_truncated/record_27.json +3 -0
- extraction/non_truncated/record_28.json +3 -0
- extraction/non_truncated/record_29.json +3 -0
- extraction/non_truncated/record_3.json +3 -0
- extraction/non_truncated/record_30.json +3 -0
- extraction/non_truncated/record_31.json +3 -0
- extraction/non_truncated/record_32.json +3 -0
- extraction/non_truncated/record_33.json +3 -0
- extraction/non_truncated/record_34.json +3 -0
- extraction/non_truncated/record_35.json +3 -0
- extraction/non_truncated/record_36.json +3 -0
- extraction/non_truncated/record_37.json +3 -0
- extraction/non_truncated/record_38.json +3 -0
- extraction/non_truncated/record_39.json +3 -0
- extraction/non_truncated/record_4.json +3 -0
- extraction/non_truncated/record_40.json +3 -0
- extraction/non_truncated/record_41.json +3 -0
- extraction/non_truncated/record_42.json +3 -0
- extraction/non_truncated/record_43.json +3 -0
- extraction/non_truncated/record_44.json +3 -0
- extraction/non_truncated/record_45.json +3 -0
- extraction/non_truncated/record_46.json +3 -0
- extraction/non_truncated/record_47.json +3 -0
- extraction/non_truncated/record_48.json +3 -0
- extraction/non_truncated/record_49.json +3 -0
- extraction/non_truncated/record_5.json +3 -0
- extraction/non_truncated/record_6.json +3 -0
- extraction/non_truncated/record_7.json +3 -0
.gitattributes
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
*.json filter=lfs diff=lfs merge=lfs -text
|
2 |
+
*.jsonl filter=lfs diff=lfs merge=lfs -text
|
3 |
+
*.pdf filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
title: PDF Extraction Comparison
|
2 |
+
emoji: 📉
|
3 |
+
colorFrom: green
|
4 |
+
colorTo: gray
|
5 |
+
sdk: gradio
|
6 |
+
sdk_version: 5.27.0
|
7 |
+
app_file: extractor_compare.py
|
8 |
+
pinned: false
|
extraction/non_truncated/record_0.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:167521da014ee1816adfa9667e045dc5835ebbfde0d4c036a1c354e15f51dbca
|
3 |
+
size 63882
|
extraction/non_truncated/record_1.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f0a96a2e7dc9833c93b2817f91ea2cdb46844bd8f216b34ec88bbb3b404183e
|
3 |
+
size 2355885
|
extraction/non_truncated/record_10.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09b4a9ac963d2795aef7a86d20944049d2554a7cf75dd94a58c17115dc581299
|
3 |
+
size 1477192
|
extraction/non_truncated/record_11.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cf21c60728cba6f508dbf44c98cd4b968df2cce2bfcb05f0647762edf54f487
|
3 |
+
size 68649
|
extraction/non_truncated/record_12.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc2d0f828fdf221ee601cc6904e599665b4ae12082e2b9d2a76c2f7d32528921
|
3 |
+
size 58362
|
extraction/non_truncated/record_13.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2182ed09edf5a0aa885f1ac28dddf070d96342c8606fd27e4315e44b39ade036
|
3 |
+
size 263549
|
extraction/non_truncated/record_14.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3066f1b77f8d4190cf2928a09f883dc6b3f628cf257a9479d9bf822df465e389
|
3 |
+
size 610239
|
extraction/non_truncated/record_15.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5eb949316ebfd20294ddd0c1e1ac73a748da4a3f1bfefc819f2c292b54e4ef55
|
3 |
+
size 225940
|
extraction/non_truncated/record_16.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3f7bec9722662ec468459191a19077ccbdda6f4c4bd7156f0d3ba46908afed5
|
3 |
+
size 207706
|
extraction/non_truncated/record_17.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c6eeee023c92b02ccc1dcb9d775e80eab03a82f78a062e266590427aa8cd5cd
|
3 |
+
size 151205
|
extraction/non_truncated/record_18.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ca829e8020f472452f7c41ec63f3ddfcdd6dce0b04167c383c311e290129124
|
3 |
+
size 730429
|
extraction/non_truncated/record_19.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a5e819288bc5b404228abe38e4e07c966a13597f8cb1ae0336c1d58cebd0573
|
3 |
+
size 4347952
|
extraction/non_truncated/record_2.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26cb541e4ed8038eb44dce3f74a40b2a748f09e3ce98168c95b1ae6959699e31
|
3 |
+
size 200511
|
extraction/non_truncated/record_20.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3695a6b19de6b483e6f9f4ce417584d3bca274d1a18bb88f1fc3bc3a4e5a372
|
3 |
+
size 34621
|
extraction/non_truncated/record_21.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60619c8ebe2caba7c9e2ea3304418a461bd351b90ec6a1a3a3af31fb92ef0196
|
3 |
+
size 1403253
|
extraction/non_truncated/record_22.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9939ba567c0e42fd17ecef79384c5125e56cb5bd53f2229b0115301d048ecc00
|
3 |
+
size 505232
|
extraction/non_truncated/record_23.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81be2481d68dd31f741082419de4dcfd8aa4575200d1fddad407f476a1dedd76
|
3 |
+
size 889179
|
extraction/non_truncated/record_24.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf0f8312ea71e37843d206374692ae41e92f42d442a4c5ec7599eb3ca59e0a88
|
3 |
+
size 951925
|
extraction/non_truncated/record_25.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86828204d28fb8bbc5031f49548d8a9949767c58ffae242bd401a8996461475b
|
3 |
+
size 30260
|
extraction/non_truncated/record_26.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a25e63f13b7efa1af614ed705b31a05ea32481e9e354964e1a207652b66a4e19
|
3 |
+
size 189677
|
extraction/non_truncated/record_27.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7709908a0df97a54b8b99f423d646bb280904efa26c97b83989021aacf32cb5
|
3 |
+
size 384357
|
extraction/non_truncated/record_28.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa2f0b2e981d2972a9c8a52234a5a736eb0f6c86cdb36c61e76b8580a4ec6583
|
3 |
+
size 38877
|
extraction/non_truncated/record_29.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ad40b768f55f12542d29a4abb4c832188401046a13611671199350b4c95d921
|
3 |
+
size 135635
|
extraction/non_truncated/record_3.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b1ff68c4d0a3f81aaa60d970767832f823c498286f8c149efeb25b9e6079648
|
3 |
+
size 655199
|
extraction/non_truncated/record_30.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5ac40be45da7450a9430f86b45eddb1f0913f0884ed84e67dff6a9d9eae0596
|
3 |
+
size 196521
|
extraction/non_truncated/record_31.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3120768e0f4f63acfb4ea6c504634c129d40179730e9a268170f4a4cdc1904d
|
3 |
+
size 885829
|
extraction/non_truncated/record_32.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f86e7ab93d134a1fa59bfe062ba6fc226a323f976012320ac61d9b3e56bde0b
|
3 |
+
size 372363
|
extraction/non_truncated/record_33.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ecf8838485b6667b1362f39f5a0d7886b4a05ed61f80fccdf2f71b9fe9b98c7
|
3 |
+
size 5082783
|
extraction/non_truncated/record_34.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:395237b321ad926362bd520315d527184261f73cf031533aa170d2a36ef80409
|
3 |
+
size 38339
|
extraction/non_truncated/record_35.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45172f2b9c3975dc0fa102323d65c98606edaf0dfcfaf1e94c5075bb6ba58eb9
|
3 |
+
size 363612
|
extraction/non_truncated/record_36.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1838aa1feed4c9f70dd600276f4d83249ab8f046acc9d67a9028abacde224af1
|
3 |
+
size 696226
|
extraction/non_truncated/record_37.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eebf8813eba242eaf54427058dadd927c037074645fb6872b068f692e35d8cc
|
3 |
+
size 188427
|
extraction/non_truncated/record_38.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c90ff6c48476635f96802b94a776605f887bcbc305b23e1b4c579c3f8ae567b9
|
3 |
+
size 858917
|
extraction/non_truncated/record_39.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0859d7ced21f7147b79de2e68798076063f3630379e1bd62097750191658d2ba
|
3 |
+
size 231498
|
extraction/non_truncated/record_4.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5dc03dd9e70cbdfbe2f1a2010686f18f984ca5c4d94e6f006de0d4225c43c57
|
3 |
+
size 336622
|
extraction/non_truncated/record_40.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6831ac023d481844a3368394b5853697f6d1ac5b7ee8042f606c2cc72de28492
|
3 |
+
size 189523
|
extraction/non_truncated/record_41.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b2c3b9c753feb18018980143409d4a670a2b36f85f271d66e3574297391bb69
|
3 |
+
size 1717290
|
extraction/non_truncated/record_42.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:103d572230006e3231311feaa9fb18541fbe7347330c195e7e49f8462c131936
|
3 |
+
size 504077
|
extraction/non_truncated/record_43.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c26bd2a27e3f7c1cae06a965f4b36333d9eac548238f155a9f22502c1edc9ed8
|
3 |
+
size 178433
|
extraction/non_truncated/record_44.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc3c4e63fe0d91dcc7927005b6bbce23aad1f6a76f438b12334952652bf5811f
|
3 |
+
size 578235
|
extraction/non_truncated/record_45.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4828368d4df51ee31aac1d332965e597d2ad7e7d69eb12c62547984d333b9c7
|
3 |
+
size 65628
|
extraction/non_truncated/record_46.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1a5c9af7071dc69a5a2ebc8ba8fa75e55dbcca845215d60cfd82662803f05b4
|
3 |
+
size 353066
|
extraction/non_truncated/record_47.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cb7f41c1b0950e0a87846f0b79077eadbff0d70dad758904db03df28b4db761
|
3 |
+
size 587671
|
extraction/non_truncated/record_48.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a57ef801045de8bb4bd18e4ba6e9385a97b64b1263e8e2f215b53ef2c3a3785
|
3 |
+
size 139104
|
extraction/non_truncated/record_49.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86703b12aaa2586771ad8140184dedfe719c490bfdeaf1098d7b447d03b5a1e3
|
3 |
+
size 424608
|
extraction/non_truncated/record_5.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e81014ac3d91bf012f645e1732f1292ab417a4bffe50f0a37d3ba5bb99cb0549
|
3 |
+
size 463779
|
extraction/non_truncated/record_6.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c581ce6b5af035a25ba1f0a0a3c3c25bb95bb3a8009c17a09430d9d51153a4e7
|
3 |
+
size 723599
|
extraction/non_truncated/record_7.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e71c27130c52ca65accba4ca8415144d3aafc3167bafcc0e0736978e192b1745
|
3 |
+
size 402046
|