File size: 1,956 Bytes
fbea007
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
name: tableformer_accurate_jpqd
description: TableFormer accurate model for high-precision table structure recognition, optimized with JPQD quantization
framework: ONNX
task: table-structure-recognition
domain: computer-vision
subdomain: document-analysis

model_info:
  architecture: TableFormer (Transformer-based)
  paper: "TableFormer: Table Structure Understanding With Transformers"
  paper_url: "https://doi.org/10.1109/CVPR52688.2022.00457"
  original_source: Docling
  original_repo: "https://github.com/DS4SD/docling"
  optimization: JPQD quantization
  variant: accurate
  
specifications:
  input_shape: [1, 10]  # Based on model analysis
  input_type: int64
  input_format: Processed table features
  output_shape: [1, 10]
  output_type: float32
  batch_size: dynamic
  
performance:
  teds_score_simple: 95.4
  teds_score_complex: 90.1  
  teds_score_overall: 93.6
  inference_time_cpu_ms: ~1
  accuracy_retention: ">99%"
  
deployment:
  runtime: onnxruntime
  hardware: CPU-optimized
  precision: INT8 weights, FP32 activations
  memory_usage_mb: ~25
  
usage:
  preprocessing:
    - Extract table regions from document images
    - Apply TableFormer-specific preprocessing
    - Convert to model input format
  postprocessing:
    - Parse table structure predictions
    - Extract cell boundaries and types
    - Generate structured table representation

benchmarks:
  dataset: PubTabNet, FinTabNet
  metric: TEDS (Tree-Edit-Distance-based Similarity)
  comparison:
    - "Better than Tabula (67.9 vs 93.6 TEDS)"
    - "Better than Camelot (73.0 vs 93.6 TEDS)" 
    - "Better than EDD (88.3 vs 93.6 TEDS)"

applications:
  - PDF document conversion
  - Academic paper processing  
  - Financial document analysis
  - Legal document digitization
  - Invoice and form processing

license: cdla-permissive-2.0
tags:
  - table-structure-recognition
  - tableformer
  - document-analysis
  - onnx
  - quantized
  - jpqd
  - docling
  - accurate