-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathdatabricks.yml
More file actions
93 lines (89 loc) · 3.34 KB
/
databricks.yml
File metadata and controls
93 lines (89 loc) · 3.34 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
# Bundle identity. `${bundle.name}` is interpolated into each target's
# workspace root_path.
bundle:
  name: doc-intel-10k
# Glob for the resource definition files that make up this bundle.
include:
  - resources/**/*.yml
# Bundle-level variables. The targets in this file override a subset of them
# (catalog, schema, lakebase_instance, lakebase_stopped, app_obo_required).
variables:
  catalog:
    description: Unity Catalog name
    default: workspace

  lakebase_instance:
    description: Lakebase Postgres instance name (must be DNS-compliant — alphanumeric + hyphens only)
    default: docintel-state

  lakebase_stopped:
    # Folded scalar: the lines below join into one single-line description.
    description: >-
      Whether the Lakebase Postgres instance should be stopped. Must be false
      on first creation (the API rejects creating directly into stopped state);
      flip to true after the instance exists if the env should be paused.
    default: false

  schema:
    description: Schema for all 10-K Analyst resources
    default: docintel_10k

  service_principal_id:
    description: Service Principal application ID for prod deploys
    # Intentionally empty; the prod target passes this value to `run_as`.
    default: ""

  warehouse_id:
    description: SQL warehouse used by index-refresh and dashboards
    # No default: the value comes from a `lookup` on the warehouse name.
    lookup:
      warehouse: Serverless Starter Warehouse

  embedding_model_endpoint_name:
    description: Mosaic AI embedding endpoint used by Vector Search
    default: databricks-bge-large-en

  quality_threshold:
    description: Minimum quality_score (0-30) required for embed_eligible
    default: 22

  max_pdf_bytes:
    description: Reject filings larger than this many bytes (50 MB)
    # 52428800 = 50 * 1024 * 1024
    default: 52428800

  analyst_group:
    description: UC group granted SELECT/USE on the catalog/schema
    default: account users

  agent_endpoint_name:
    description: Agent Bricks Supervisor serving endpoint name resolved by agent.document_intelligence_agent
    # Placeholder value; no target in this file overrides it.
    default: UNSET_AGENT_BRICKS_ENDPOINT

  app_obo_required:
    description: Whether the Databricks App requires user-token passthrough for Agent Bricks calls
    # Kept as a quoted string ("true"/"false"), not a YAML boolean.
    default: "true"
# Deployment targets: `demo` (the default target) and `prod`.
targets:
  demo:
    default: true
    workspace:
      profile: DEFAULT
      # The root path is keyed by the deploying user so that demo deploys from
      # two engineers do not overwrite each other.
      # `${workspace.current_user.userName}` resolves to the auth profile's
      # email at deploy time.
      root_path: /Workspace/Users/${workspace.current_user.userName}/.bundle/${bundle.name}/demo
    variables:
      catalog: workspace
      schema: docintel_10k_demo
      lakebase_instance: docintel-demo-state-v1
      app_obo_required: "false"
    resources:
      pipelines:
        doc_intel_pipeline:
          development: true
          # Demo-only override: triggered runs instead of a continuous
          # pipeline, so smoke iterations do not keep a serverless cluster
          # running. Prod inherits `continuous: true` from
          # resources/foundation/doc_intel.pipeline.yml.
          continuous: false

  prod:
    mode: production
    workspace:
      profile: DEFAULT
      root_path: /Workspace/Shared/.bundle/${bundle.name}/prod
    # Constitution VI and Databricks Asset Bundles production mode both
    # require a service-principal `run_as`. Because `service_principal_id`
    # defaults to "", `bundle validate -t prod` fails loudly until it is set;
    # that failure is the safety net. Supply it on deploy with
    # `--var service_principal_id=<sp-app-id>`.
    run_as:
      service_principal_name: ${var.service_principal_id}
    variables:
      catalog: workspace
      schema: docintel_10k
      lakebase_instance: docintel-prod-state
      lakebase_stopped: false
      app_obo_required: "true"
    resources:
      apps:
        analyst_app:
          # User-token API scopes set on the app for the prod target.
          user_api_scopes:
            - serving.serving-endpoints
            - sql
            - iam.access-control:read
            - iam.current-user:read