Hebo Yang
05/16/2023, 4:00 PM
# Run-retry settings as pasted in the thread: retries are switched off and the
# retry budget is zero.
runRetries:
  enabled: false
  maxRetries: 0
daniel
05/16/2023, 4:01 PMdaniel
05/16/2023, 4:08 PMHebo Yang
05/16/2023, 4:13 PM
# Local artifact storage rooted at base_dir.
local_artifact_storage:
  module: dagster._core.storage.root
  class: LocalArtifactStorage
  config:
    base_dir: /opt/dagster/dagster_home
# Run storage: PostgresRunStorage from dagster_postgres.
# Connection settings live under postgres_db; the password is referenced
# through an `env` entry instead of being written inline.
run_storage:
  module: dagster_postgres.run_storage
  class: PostgresRunStorage
  config:
    postgres_db:
      db_name: xyz
      hostname: xyz.us-west-2.rds.amazonaws.com
      params: {}
      password:
        env: xyz
      port: 5432
      username: xyz
# Event log storage: PostgresEventLogStorage from dagster_postgres.
# Uses database `dagster_prod`; the password is referenced through an `env`
# entry instead of being written inline.
event_log_storage:
  module: dagster_postgres.event_log
  class: PostgresEventLogStorage
  config:
    postgres_db:
      db_name: dagster_prod
      hostname: xyz.us-west-2.rds.amazonaws.com
      params: {}
      password:
        env: xyz
      port: 5432
      username: xyz
# Compute log manager: the no-op implementation, with an empty config.
compute_logs:
  module: dagster._core.storage.noop_compute_log_manager
  class: NoOpComputeLogManager
  config: {}
# Schedule storage: PostgresScheduleStorage from dagster_postgres.
# Connection settings live under postgres_db; the password is referenced
# through an `env` entry instead of being written inline.
schedule_storage:
  module: dagster_postgres.schedule_storage
  class: PostgresScheduleStorage
  config:
    postgres_db:
      db_name: xyz
      hostname: xyz.us-west-2.rds.amazonaws.com
      params: {}
      password:
        env: xyz
      port: 5432
      username: xyz
# Scheduler: DagsterDaemonScheduler, with an empty config.
scheduler:
  module: dagster._core.scheduler
  class: DagsterDaemonScheduler
  config: {}
# Run coordinator: QueuedRunCoordinator with one global cap
# (max_concurrent_runs) plus a list of per-tag limits.
# Each tag_concurrency_limits entry has a tag `key` and a `limit`; an optional
# `value` narrows the entry to one tag value, or (as a mapping with
# applyLimitPerUniqueValue) presumably applies the limit separately to every
# distinct value of that tag — confirm against the Dagster docs.
run_coordinator:
  module: dagster._core.run_coordinator
  class: QueuedRunCoordinator
  config:
    max_concurrent_runs: 125
    tag_concurrency_limits:
      - key: dagster/sensor
        limit: 80
      - key: dagster/backfill
        limit: 65
      - key: databricks
        limit: 50
      - key: fabricator
        limit: 50
      - key: fabricator/source
        limit: 10
        value:
          applyLimitPerUniqueValue: true
      - key: fabricator/user
        limit: 12
        value:
          applyLimitPerUniqueValue: true
      # metrics-repo: one overall entry, then one entry per specific value.
      - key: metrics-repo
        limit: 50
      - key: metrics-repo
        limit: 20
        value: event_source
      - key: metrics-repo
        limit: 25
        value: analysis_exposures
      - key: metrics-repo
        limit: 40
        value: metric_analysis
      - key: metrics-repo
        limit: 30
        value: analysis_quality_tests
      - key: simdash
        limit: 50
      - key: curator
        limit: 50
# Run launcher: K8sRunLauncher from dagster_k8s, targeting the `dagster`
# namespace and service account, with in-cluster Kubernetes config loading.
run_launcher:
  module: dagster_k8s
  class: K8sRunLauncher
  config:
    dagster_home: /opt/dagster/dagster_home
    image_pull_policy: Always
    instance_config_map: dagster-instance
    job_namespace: dagster
    load_incluster_config: true
    postgres_password_secret: dagster-postgresql-secret
    service_account_name: dagster
# Run monitoring is enabled, with a 3000-second start timeout and a
# 300-second poll interval.
run_monitoring:
  enabled: true
  start_timeout_seconds: 3000
  poll_interval_seconds: 300
# Sensor evaluation uses threads, with 4 workers.
sensors:
  use_threads: true
  num_workers: 4
# Tick retention. Sensor ticks get a purge age (in days) per tick status;
# schedule ticks share a single setting.
# NOTE(review): -1 presumably means "never purge" — confirm against the
# Dagster retention documentation.
retention:
  sensor:
    purge_after_days:
      failure: 90
      skipped: 7
      started: -1
      success: -1
  schedule:
    purge_after_days: -1
# Telemetry is turned off.
telemetry:
  enabled: false
Hebo Yang
05/16/2023, 4:15 PMkubectl get po -n dagster | grep 09829157-20bc-4ff4-a734-6fb580ba19a3
dagster-run-09829157-20bc-4ff4-a734-6fb580ba19a3-1-cmqs9 0/1 OOMKilled 0 14h
dagster-run-09829157-20bc-4ff4-a734-6fb580ba19a3-2-slcrq 0/1 OOMKilled 0 13h
dagster-run-09829157-20bc-4ff4-a734-6fb580ba19a3-3-gxlgd 0/1 Completed 0 12h
daniel
05/16/2023, 4:15 PMdaniel
05/16/2023, 4:15 PMHebo Yang
05/16/2023, 4:15 PMkubectl get job -n dagster | grep 09829157-20bc-4ff4-a734-6fb580ba19a3
dagster-run-09829157-20bc-4ff4-a734-6fb580ba19a3 0/1 14h 14h
dagster-run-09829157-20bc-4ff4-a734-6fb580ba19a3-1 0/1 14h 14h
dagster-run-09829157-20bc-4ff4-a734-6fb580ba19a3-2 0/1 13h 13h
dagster-run-09829157-20bc-4ff4-a734-6fb580ba19a3-3 1/1 16m 12h
daniel
05/16/2023, 4:16 PMdaniel
05/16/2023, 4:16 PMHebo Yang
05/16/2023, 4:18 PMdaniel
05/16/2023, 4:18 PMHebo Yang
05/16/2023, 4:20 PMHebo Yang
05/16/2023, 4:20 PMdaniel
05/16/2023, 5:00 PM
# Run retries disabled, shown with the enclosing dagsterDaemon key.
dagsterDaemon:
  runRetries:
    enabled: false
You didn't include the `dagsterDaemon` key, but I assume it was there.
daniel
05/16/2023, 5:03 PMdaniel
05/16/2023, 5:03 PMrunMonitoring
daniel
05/16/2023, 5:40 PMdaniel
05/16/2023, 6:07 PMdaniel
05/16/2023, 6:08 PMHebo Yang
05/16/2023, 6:09 PM
# Run monitoring is enabled, with a 3000-second start timeout and a
# 300-second poll interval; maxResumeRunAttempts is left unset (null).
runMonitoring:
  enabled: true
  startTimeoutSeconds: 3000
  pollIntervalSeconds: 300
  maxResumeRunAttempts: null
daniel
05/16/2023, 6:09 PMdaniel
05/16/2023, 6:09 PMHebo Yang
05/16/2023, 6:10 PMHebo Yang
05/16/2023, 6:10 PMdaniel
05/16/2023, 6:11 PMdaniel
05/16/2023, 6:11 PM