Spaces:
Sleeping
Sleeping
Upload 2 files
Browse files- enhanced_sber_index.pkl +3 -0
- enhanced_sber_metadata.json +24 -0
enhanced_sber_index.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4255dabfd17f7b99f055472c20ac8c32d0b0c84411f73026fdc9bf66bdf5c01a
|
3 |
+
size 2912113
|
enhanced_sber_metadata.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"processing_stats": {
|
3 |
+
"total_pages": 402,
|
4 |
+
"pages_with_tables": 34,
|
5 |
+
"total_tables": 84,
|
6 |
+
"total_text_chunks": 1925,
|
7 |
+
"total_table_chunks": 84,
|
8 |
+
"processing_time": 151.77763056755066,
|
9 |
+
"errors": []
|
10 |
+
},
|
11 |
+
"index_metadata": {
|
12 |
+
"total_chunks": 2009,
|
13 |
+
"text_chunks": 1925,
|
14 |
+
"table_chunks": 84,
|
15 |
+
"avg_chunk_length": 532.5251368840219,
|
16 |
+
"avg_token_count": 248.2404181184669,
|
17 |
+
"pages_processed": 401,
|
18 |
+
"processing_method": "enhanced_pdfplumber_with_tables",
|
19 |
+
"table_pages": 34,
|
20 |
+
"total_words_indexed": 19261
|
21 |
+
},
|
22 |
+
"processing_date": "2025-07-06 05:00:48",
|
23 |
+
"source_file": "/mnt/c/Users/user/Documents/Работа/Сбер/Обучение/Курсовой проект/Исходные данные/Сбер 2023.pdf"
|
24 |
+
}
|