Skip to content

Commit 0ee4234

Browse files
authored
Reduce false error logging (round 1) (#2415)
* Don't log an error when the snapshot shouldn't be created; it's normal for this to happen
* Slack alerts: skip `account_inactive` errors
* v3 finalize run with no `lockedById` isn't an error
* Another false error
* Finalize run: CRASHED runs were logging errors
* All Slack alert errors are warnings except invalid blocks
1 parent 471c960 commit 0ee4234

File tree

4 files changed

+32
-15
lines changed

4 files changed

+32
-15
lines changed

apps/webapp/app/v3/services/alerts/deliverAlert.server.ts

Lines changed: 15 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -158,7 +158,7 @@ export class DeliverAlertService extends BaseService {
158158
}
159159
} catch (error) {
160160
if (error instanceof SkipRetryError) {
161-
logger.error("[DeliverAlert] Skipping retry", {
161+
logger.warn("[DeliverAlert] Skipping retry", {
162162
reason: error.message,
163163
});
164164

@@ -951,7 +951,7 @@ export class DeliverAlertService extends BaseService {
951951
return await client.chat.postMessage(message);
952952
} catch (error) {
953953
if (isWebAPIRateLimitedError(error)) {
954-
logger.error("[DeliverAlert] Slack rate limited", {
954+
logger.warn("[DeliverAlert] Slack rate limited", {
955955
error,
956956
message,
957957
});
@@ -960,7 +960,7 @@ export class DeliverAlertService extends BaseService {
960960
}
961961

962962
if (isWebAPIHTTPError(error)) {
963-
logger.error("[DeliverAlert] Slack HTTP error", {
963+
logger.warn("[DeliverAlert] Slack HTTP error", {
964964
error,
965965
message,
966966
});
@@ -969,7 +969,7 @@ export class DeliverAlertService extends BaseService {
969969
}
970970

971971
if (isWebAPIRequestError(error)) {
972-
logger.error("[DeliverAlert] Slack request error", {
972+
logger.warn("[DeliverAlert] Slack request error", {
973973
error,
974974
message,
975975
});
@@ -978,7 +978,7 @@ export class DeliverAlertService extends BaseService {
978978
}
979979

980980
if (isWebAPIPlatformError(error)) {
981-
logger.error("[DeliverAlert] Slack platform error", {
981+
logger.warn("[DeliverAlert] Slack platform error", {
982982
error,
983983
message,
984984
});
@@ -991,10 +991,19 @@ export class DeliverAlertService extends BaseService {
991991
throw new SkipRetryError("Slack invalid blocks");
992992
}
993993

994+
if (error.data.error === "account_inactive") {
995+
logger.info("[DeliverAlert] Slack account inactive, skipping retry", {
996+
error,
997+
message,
998+
});
999+
1000+
throw new SkipRetryError("Slack account inactive");
1001+
}
1002+
9941003
throw new Error("Slack platform error");
9951004
}
9961005

997-
logger.error("[DeliverAlert] Failed to send slack message", {
1006+
logger.warn("[DeliverAlert] Failed to send slack message", {
9981007
error,
9991008
message,
10001009
});

apps/webapp/app/v3/services/finalizeTaskRun.server.ts

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -150,7 +150,7 @@ export class FinalizeTaskRunService extends BaseService {
150150
}
151151

152152
if (isFatalRunStatus(run.status)) {
153-
logger.error("FinalizeTaskRunService: Fatal status", { runId: run.id, status: run.status });
153+
logger.warn("FinalizeTaskRunService: Fatal status", { runId: run.id, status: run.status });
154154

155155
const extendedRun = await this._prisma.taskRun.findFirst({
156156
where: { id: run.id },
@@ -170,7 +170,7 @@ export class FinalizeTaskRunService extends BaseService {
170170
});
171171

172172
if (extendedRun && extendedRun.runtimeEnvironment.type !== "DEVELOPMENT") {
173-
logger.error("FinalizeTaskRunService: Fatal status, requesting worker exit", {
173+
logger.warn("FinalizeTaskRunService: Fatal status, requesting worker exit", {
174174
runId: run.id,
175175
status: run.status,
176176
});
@@ -305,9 +305,10 @@ export class FinalizeTaskRunService extends BaseService {
305305
});
306306

307307
if (!run.lockedById) {
308-
logger.error(
308+
// This happens when a run is expired or was cancelled before an attempt, it's not a problem
309+
logger.info(
309310
"FinalizeTaskRunService: No lockedById, so can't get the BackgroundWorkerTask. Not creating an attempt.",
310-
{ runId: run.id }
311+
{ runId: run.id, status: run.status }
311312
);
312313
return;
313314
}

internal-packages/run-engine/src/engine/systems/checkpointSystem.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -62,7 +62,7 @@ export class CheckpointSystem {
6262
snapshot.executionStatus === "QUEUED_EXECUTING");
6363

6464
if (!isValidSnapshot) {
65-
this.$.logger.error("Tried to createCheckpoint on an invalid snapshot", {
65+
this.$.logger.info("Tried to createCheckpoint on an invalid snapshot", {
6666
snapshot,
6767
snapshotId,
6868
});

internal-packages/run-engine/src/engine/systems/dequeueSystem.ts

Lines changed: 11 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ import { PrismaClientOrTransaction } from "@trigger.dev/database";
88
import { getRunWithBackgroundWorkerTasks } from "../db/worker.js";
99
import { sendNotificationToWorker } from "../eventBus.js";
1010
import { getMachinePreset } from "../machinePresets.js";
11-
import { isDequeueableExecutionStatus } from "../statuses.js";
11+
import { isDequeueableExecutionStatus, isExecuting } from "../statuses.js";
1212
import { RunEngineOptions } from "../types.js";
1313
import { ExecutionSnapshotSystem, getLatestExecutionSnapshot } from "./executionSnapshotSystem.js";
1414
import { RunAttemptSystem } from "./runAttemptSystem.js";
@@ -132,9 +132,16 @@ export class DequeueSystem {
132132
},
133133
tx: prisma,
134134
});
135-
this.$.logger.error(
136-
`RunEngine.dequeueFromWorkerQueue(): Run is not in a valid state to be dequeued: ${runId}\n ${snapshot.id}:${snapshot.executionStatus}`
137-
);
135+
136+
if (isExecuting(snapshot.executionStatus)) {
137+
this.$.logger.error(
138+
`RunEngine.dequeueFromWorkerQueue(): Run is not in a valid state to be dequeued: ${runId}\n ${snapshot.id}:${snapshot.executionStatus}`
139+
);
140+
} else {
141+
this.$.logger.warn(
142+
`RunEngine.dequeueFromWorkerQueue(): Run is in an expected not valid state to be dequeued: ${runId}\n ${snapshot.id}:${snapshot.executionStatus}`
143+
);
144+
}
138145

139146
return;
140147
}

0 commit comments

Comments
 (0)