File size: 4,381 Bytes
c917d47
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
# Name of the token encoding used by the pipeline
# (presumably a tiktoken encoding name — confirm against the consumer).
encoding_model: cl100k_base
# Explicit empty list: no workflows are skipped.
skip_workflows: []
# Chat model settings.
# The API key is not stored in this file: ${GRAPHRAG_API_KEY} is a placeholder
# that the consumer is expected to resolve (presumably from the environment —
# confirm).
llm:
  api_key: ${GRAPHRAG_API_KEY}
  type: openai_chat
  model: gpt-4o-mini
  model_supports_json: true
  max_tokens: 4000
  # Zero temperature asks the model for the least-random output.
  temperature: 0

# Text-embedding settings: the embedding model plus the vector store that
# holds the resulting vectors.
embeddings:
  async_mode: threaded
  batch_size: 16
  # Embedding model; uses the same ${GRAPHRAG_API_KEY} placeholder as the
  # top-level `llm` section.
  llm:
    api_key: ${GRAPHRAG_API_KEY}
    type: openai_embedding
    model: text-embedding-3-small
  vector_store:
    type: lancedb
    # Located beneath the "output" directory that `storage.base_dir` also uses.
    db_uri: "output/lancedb"
    container_name: default
    # NOTE(review): presumably replaces existing vectors on each run — confirm.
    overwrite: true

# Text chunking: chunk size and overlap between consecutive chunks
# (units are presumably tokens, given `encoding_model` — confirm).
chunks:
  size: 500
  overlap: 50
  # Single-element list: chunks are grouped by the `id` column only.
  group_by_columns: [id]

# Input documents: plain-text files matched by `file_pattern` under "input".
input:
  type: file
  file_type: text
  base_dir: "input"
  # Double-quoted scalar, so "\\." is an escaped backslash; the effective
  # regex is .*\.txt$ (any path ending in ".txt").
  file_pattern: ".*\\.txt$"
  recursive: true
  # NOTE(review): confirm the consumer actually reads `source_tracking` and
  # `processing_order`; keys a tool does not recognize are often ignored
  # silently.
  source_tracking: true
  # Two sub-paths with distinct purposes. The same path names are referenced
  # by `source_filter` and `source_priority` elsewhere in this file.
  processing_order:
    - path: "first_paragraphs"
      priority: 1
      purpose: "graph_building"
    - path: "full_documents"
      priority: 2
      purpose: "retrieval"

# Entity extraction for the airline-baggage domain.
# Scalar options are listed first so they are not hidden below the type list.
entity_extraction:
  prompt: "prompts/entity_extraction.txt"
  max_gleanings: 2
  # Same path name as the first `input.processing_order` entry.
  # NOTE(review): confirm the consumer honours `source_filter`.
  source_filter: "first_paragraphs"
  entity_types:
    # Physical baggage attributes
    - "Baggage Type"
    - "Dimension"
    - "Linear Dimension"
    - "Weight"
    - "Material Type"
    - "Wheel Configuration"
    - "Measurement Unit"
    - "Size Category"
    - "Weight Category"
    # Carrier, route and cabin
    - "Airline"
    - "Alliance"
    - "Airport"
    - "Route Type"
    - "Travel Class"
    - "Cabin Section"
    - "Aircraft Type"
    # Rules and pricing
    - "Restriction"
    - "Exemption"
    - "Policy"
    - "Fee Structure"
    - "Currency"
    - "Allowance"
    # Item categories
    - "Special Item"
    - "Prohibited Item"
    - "Restricted Item"
    - "Dangerous Good"
    - "Fragile Item"
    - "Valuable Item"
    # Documents and labelling
    - "Required Document"
    - "Label Type"
    - "Tag Category"
    # Service and handling
    - "Service Type"
    - "Handler Role"
    - "Service Location"
    - "Time Period"
    # Passenger attributes
    - "Passenger Type"
    - "Membership Level"
    - "Group Category"

# Claim extraction for the airline-baggage domain.
# Scalar options are listed first so they are not hidden below the type list.
claim_extraction:
  enabled: true
  prompt: "prompts/claim_extraction.txt"
  # NOTE(review): this description names only measurements, weight limits and
  # restrictions, while `claim_types` also covers fees, liability, handling
  # and exceptions — confirm the narrower wording is intended.
  description: "Extract baggage measurements, weight limits, and restrictions from airline documentation."
  max_gleanings: 2
  # Same path name as the first `input.processing_order` entry.
  # NOTE(review): confirm the consumer honours `source_filter`.
  source_filter: "first_paragraphs"
  claim_types:
    # Size and weight limits
    - "Basic Size Restriction"
    - "Oversize Condition"
    - "Weight Limit Standard"
    - "Overweight Condition"
    - "Combined Dimension Limit"
    - "Cabin Storage Requirement"
    # Fees
    - "Standard Fee"
    - "Excess Fee"
    - "Oversize Fee"
    - "Overweight Fee"
    - "Special Handling Fee"
    - "Season Surcharge"
    - "Route-Specific Fee"
    - "Multi-Piece Pricing"
    - "Fee Waiver Condition"
    # Allowances
    - "Basic Allowance"
    - "Class-Based Allowance"
    - "Status-Based Allowance"
    - "Route-Based Allowance"
    - "Special Group Allowance"
    - "Seasonal Allowance"
    - "Equipment Allowance"
    # Item restrictions and packaging
    - "Prohibited Item Policy"
    - "Restricted Item Condition"
    - "Dangerous Goods Policy"
    - "Special Item Restriction"
    - "Packaging Requirement"
    - "Declaration Requirement"
    # Handling and logistics
    - "Check-in Deadline"
    - "Special Handling Procedure"
    - "Priority Handling Rule"
    - "Transfer Handling Policy"
    - "Delivery Service Policy"
    - "Storage Policy"
    # Liability and claims
    - "Liability Limit"
    - "Insurance Requirement"
    - "Claim Procedure"
    - "Compensation Policy"
    - "Time Limit Policy"
    # Operational constraints
    - "Weather Restriction"
    - "Seasonal Restriction"
    - "Aircraft Limitation"
    - "Route Restriction"
    - "Connection Impact"
    # Tagging and documentation
    - "Tag Requirement"
    - "Label Requirement"
    - "Documentation Requirement"
    - "Declaration Policy"
    # Service standards
    - "Handling Standard"
    - "Service Level Agreement"
    - "Priority Service Standard"
    - "Delivery Time Standard"
    # Exceptions
    - "Medical Exception"
    - "Military Exception"
    - "Diplomatic Exception"
    - "Event Exception"
    - "Emergency Exception"

# Local (entity-centred) search settings.
local_search:
  # NOTE(review): text_unit_prop + community_prop = 1.0. If the consumer
  # gives the remaining share of the context budget to entity/relationship
  # data, nothing is left for it — confirm this split is intended.
  text_unit_prop: 0.7
  community_prop: 0.3
  top_k_mapped_entities: 15
  top_k_relationships: 15
  max_tokens: 4000
  # Path names match the two `input.processing_order` entries.
  # NOTE(review): confirm the consumer honours `source_priority`.
  source_priority:
    graph_search: "first_paragraphs"
    answer_retrieval: "full_documents"

# Global search settings: token budgets for the overall request, the data
# context, and the map and reduce steps.
global_search:
  max_tokens: 4000
  data_max_tokens: 4000
  map_max_tokens: 1000
  reduce_max_tokens: 2000
  # Disabled: presumably restricts answers to the indexed data — confirm.
  allow_general_knowledge: false
  # NOTE(review): confirm the scale and comparison direction of this threshold.
  min_score_threshold: 0.1
  concurrency: 10

# Graph embedding step (enabled).
# The walk/window parameters look like random-walk embedding settings
# (presumably node2vec-style — confirm against the consumer).
embed_graph:
  enabled: true
  num_walks: 100
  walk_length: 10
  window_size: 5
  iterations: 10

# UMAP step (enabled).
umap:
  enabled: true
  n_neighbors: 15
  min_dist: 0.1
  # Presumably the number of output dimensions (2 = a flat layout) — confirm.
  n_components: 2

# Pipeline output storage: file-based, rooted at "output".
# `embeddings.vector_store.db_uri` points inside this same directory.
storage:
  type: file
  base_dir: "output"

# Cache: file-based, rooted at "cache".
cache:
  type: file
  base_dir: "cache"

# Reporting output: file-based, rooted at "reports".
reporting:
  type: file
  base_dir: "reports"
  # NOTE(review): confirm the consumer recognizes `include_source_tracking`;
  # keys a tool does not recognize are often ignored silently.
  include_source_tracking: true