# Snapshot of revision c917d47 (file size: 4,381 bytes).
---
# Name of the token encoding; presumably a tiktoken encoding — TODO confirm.
encoding_model: cl100k_base
# Empty list: no workflows are listed to be skipped.
skip_workflows: []
# Chat model settings. Child keys must stay indented under `llm`; at column 0
# they would become (duplicate) top-level keys and `llm` itself would be null.
llm:
  # `${...}` placeholder: the key is expected to come from the
  # GRAPHRAG_API_KEY environment variable rather than being stored here.
  api_key: ${GRAPHRAG_API_KEY}
  type: openai_chat
  model: gpt-4o-mini
  model_supports_json: true
  max_tokens: 4000
  temperature: 0
# Text-embedding settings. This section carries its own nested `llm` mapping,
# which must be indented here so it does not collide with the top-level `llm`.
embeddings:
  async_mode: threaded
  batch_size: 16
  # Where embedding vectors are persisted.
  vector_store:
    type: lancedb
    db_uri: 'output/lancedb'
    container_name: default
    overwrite: true
  # Embedding model; uses the same API-key placeholder as the chat model.
  llm:
    api_key: ${GRAPHRAG_API_KEY}
    type: openai_embedding
    model: text-embedding-3-small
# Text chunking settings.
chunks:
  # Chunk size and overlap; presumably measured in tokens — TODO confirm.
  size: 500
  overlap: 50
  group_by_columns: [id]
# Input document discovery.
input:
  type: file
  file_type: text
  base_dir: "input"
  # Regular expression matched against file names; selects names ending in ".txt".
  file_pattern: ".*\\.txt$"
  recursive: true
  # NOTE(review): `source_tracking` and `processing_order` look like
  # project-specific extensions — confirm the consumer actually reads them.
  source_tracking: true
  # Each entry is one mapping with `path`, `priority` and `purpose`; the three
  # keys must share a list item or they collapse into duplicate keys.
  processing_order:
    - path: "first_paragraphs"
      priority: 1
      purpose: "graph_building"
    - path: "full_documents"
      priority: 2
      purpose: "retrieval"
# Entity extraction settings.
entity_extraction:
  # Path to the prompt template file.
  prompt: "prompts/entity_extraction.txt"
  # Entity categories to extract, grouped by theme for readability.
  entity_types:
    # Baggage attributes
    - "Baggage Type"
    - "Dimension"
    - "Linear Dimension"
    - "Weight"
    - "Material Type"
    - "Wheel Configuration"
    - "Measurement Unit"
    - "Size Category"
    - "Weight Category"
    # Carrier, route and cabin
    - "Airline"
    - "Alliance"
    - "Airport"
    - "Route Type"
    - "Travel Class"
    - "Cabin Section"
    - "Aircraft Type"
    # Rules and fees
    - "Restriction"
    - "Exemption"
    - "Policy"
    - "Fee Structure"
    - "Currency"
    - "Allowance"
    # Item categories
    - "Special Item"
    - "Prohibited Item"
    - "Restricted Item"
    - "Dangerous Good"
    - "Fragile Item"
    - "Valuable Item"
    # Documents and labelling
    - "Required Document"
    - "Label Type"
    - "Tag Category"
    # Services and handling
    - "Service Type"
    - "Handler Role"
    - "Service Location"
    - "Time Period"
    # Passengers
    - "Passenger Type"
    - "Membership Level"
    - "Group Category"
  max_gleanings: 2
  # NOTE(review): `source_filter` looks like a project-specific extension;
  # its value matches the "first_paragraphs" input path — confirm it is honoured.
  source_filter: "first_paragraphs"
# Claim extraction settings.
claim_extraction:
  enabled: true
  # NOTE(review): `claim_types` looks like a project-specific extension —
  # confirm the consumer reads it. Entries are grouped by theme for readability.
  claim_types:
    # Size and weight limits
    - "Basic Size Restriction"
    - "Oversize Condition"
    - "Weight Limit Standard"
    - "Overweight Condition"
    - "Combined Dimension Limit"
    - "Cabin Storage Requirement"
    # Fees
    - "Standard Fee"
    - "Excess Fee"
    - "Oversize Fee"
    - "Overweight Fee"
    - "Special Handling Fee"
    - "Season Surcharge"
    - "Route-Specific Fee"
    - "Multi-Piece Pricing"
    - "Fee Waiver Condition"
    # Allowances
    - "Basic Allowance"
    - "Class-Based Allowance"
    - "Status-Based Allowance"
    - "Route-Based Allowance"
    - "Special Group Allowance"
    - "Seasonal Allowance"
    - "Equipment Allowance"
    # Item policies
    - "Prohibited Item Policy"
    - "Restricted Item Condition"
    - "Dangerous Goods Policy"
    - "Special Item Restriction"
    - "Packaging Requirement"
    - "Declaration Requirement"
    # Handling procedures
    - "Check-in Deadline"
    - "Special Handling Procedure"
    - "Priority Handling Rule"
    - "Transfer Handling Policy"
    - "Delivery Service Policy"
    - "Storage Policy"
    # Liability and claims
    - "Liability Limit"
    - "Insurance Requirement"
    - "Claim Procedure"
    - "Compensation Policy"
    - "Time Limit Policy"
    # Operational restrictions
    - "Weather Restriction"
    - "Seasonal Restriction"
    - "Aircraft Limitation"
    - "Route Restriction"
    - "Connection Impact"
    # Tagging and documentation
    - "Tag Requirement"
    - "Label Requirement"
    - "Documentation Requirement"
    - "Declaration Policy"
    # Service standards
    - "Handling Standard"
    - "Service Level Agreement"
    - "Priority Service Standard"
    - "Delivery Time Standard"
    # Exceptions
    - "Medical Exception"
    - "Military Exception"
    - "Diplomatic Exception"
    - "Event Exception"
    - "Emergency Exception"
  # Path to the prompt template file.
  prompt: "prompts/claim_extraction.txt"
  description: "Extract baggage measurements, weight limits, and restrictions from airline documentation."
  max_gleanings: 2
  # NOTE(review): `source_filter` looks like a project-specific extension;
  # its value matches the "first_paragraphs" input path — confirm it is honoured.
  source_filter: "first_paragraphs"
# Local search settings.
local_search:
  # The two proportions below sum to 1.0 (0.7 + 0.3).
  text_unit_prop: 0.7
  community_prop: 0.3
  top_k_mapped_entities: 15
  top_k_relationships: 15
  max_tokens: 4000
  # NOTE(review): `source_priority` looks like a project-specific extension;
  # its values match the two input paths — confirm the consumer reads it.
  source_priority:
    graph_search: "first_paragraphs"
    answer_retrieval: "full_documents"
# Global search settings. Its `max_tokens` must stay nested here; at column 0
# it would duplicate the `max_tokens` keys of other sections.
global_search:
  max_tokens: 4000
  data_max_tokens: 4000
  map_max_tokens: 1000
  reduce_max_tokens: 2000
  # NOTE(review): `allow_general_knowledge` and `min_score_threshold` may not
  # be recognised as file-level options — confirm against the consumer's schema.
  allow_general_knowledge: false
  min_score_threshold: 0.1
  concurrency: 10
# Graph embedding settings. The walk/window parameter names suggest a
# random-walk embedding (e.g. node2vec) — TODO confirm.
embed_graph:
  enabled: true
  num_walks: 100
  walk_length: 10
  window_size: 5
  iterations: 10
# UMAP settings; `n_components: 2` requests a two-component output.
umap:
  enabled: true
  # NOTE(review): confirm the consumer honours these tuning keys and not only
  # `enabled`.
  n_neighbors: 15
  min_dist: 0.1
  n_components: 2
# File-based storage rooted at "output". `type` and `base_dir` must stay
# nested, or they duplicate the same keys used by other sections.
storage:
  type: file
  base_dir: "output"
# File-based cache rooted at "cache". `type` and `base_dir` must stay nested,
# or they duplicate the same keys used by other sections.
cache:
  type: file
  base_dir: "cache"
# File-based reporting rooted at "reports".
reporting:
  type: file
  base_dir: "reports"
  # The stray trailing "|" was removed so this parses as boolean true rather
  # than the string "true |".
  # NOTE(review): assumed to belong under `reporting`, and looks like a
  # project-specific extension — confirm placement and that it is honoured.
  include_source_tracking: true