mirror of
https://github.com/tdurieux/anonymous_github.git
synced 2026-03-28 00:00:20 +01:00
feat: handle repository download and remove using a job queue
This commit is contained in:
@@ -14,6 +14,7 @@ import GitHubBase from "./source/GitHubBase";
|
||||
import Conference from "./Conference";
|
||||
import ConferenceModel from "./database/conference/conferences.model";
|
||||
import AnonymousError from "./AnonymousError";
|
||||
import { downloadQueue } from "./queue";
|
||||
|
||||
export default class Repository {
|
||||
private _model: IAnonymizedRepositoryDocument;
|
||||
@@ -103,16 +104,21 @@ export default class Repository {
|
||||
this.expire();
|
||||
}
|
||||
}
|
||||
if (this.status == "expired") {
|
||||
throw new AnonymousError("repository_expired", this);
|
||||
}
|
||||
if (this.status == "removed") {
|
||||
if (
|
||||
this.status == "expired" ||
|
||||
this.status == "expiring" ||
|
||||
this.status == "removing" ||
|
||||
this.status == "removed"
|
||||
) {
|
||||
throw new AnonymousError("repository_expired", this);
|
||||
}
|
||||
const fiveMinuteAgo = new Date();
|
||||
fiveMinuteAgo.setMinutes(fiveMinuteAgo.getMinutes() - 5);
|
||||
|
||||
if (this.status == "download" && this._model.statusDate > fiveMinuteAgo) {
|
||||
if (
|
||||
this.status == "preparing" ||
|
||||
(this.status == "download" && this._model.statusDate > fiveMinuteAgo)
|
||||
) {
|
||||
throw new AnonymousError("repository_not_ready", this);
|
||||
}
|
||||
}
|
||||
@@ -136,17 +142,31 @@ export default class Repository {
|
||||
* @returns void
|
||||
*/
|
||||
async updateIfNeeded(): Promise<void> {
|
||||
if (
|
||||
this.status == "expired" ||
|
||||
this.status == "expiring" ||
|
||||
this.status == "removing" ||
|
||||
this.status == "removed"
|
||||
) {
|
||||
throw new AnonymousError("repository_expired", this);
|
||||
}
|
||||
|
||||
const fiveMinuteAgo = new Date();
|
||||
fiveMinuteAgo.setMinutes(fiveMinuteAgo.getMinutes() - 5);
|
||||
if (this.status != "ready") {
|
||||
if (
|
||||
this._model.statusDate < fiveMinuteAgo &&
|
||||
this.status != "preparing"
|
||||
) {
|
||||
await this.updateStatus("preparing");
|
||||
await downloadQueue.add(this, { jobId: this.repoId });
|
||||
}
|
||||
throw new AnonymousError("repository_not_ready", this);
|
||||
}
|
||||
|
||||
const yesterday = new Date();
|
||||
yesterday.setDate(yesterday.getDate() - 1);
|
||||
|
||||
if (this._model.options.update && this._model.lastView < yesterday) {
|
||||
|
||||
const fiveMinuteAgo = new Date();
|
||||
fiveMinuteAgo.setMinutes(fiveMinuteAgo.getMinutes() - 5);
|
||||
if (this.status == "download" && this._model.statusDate > fiveMinuteAgo) {
|
||||
throw new AnonymousError("repository_not_ready", this);
|
||||
}
|
||||
|
||||
// Only GitHubBase can be update for the moment
|
||||
if (this.source instanceof GitHubBase) {
|
||||
const branches = await this.source.githubRepository.branches({
|
||||
@@ -154,30 +174,25 @@ export default class Repository {
|
||||
accessToken: await this.source.getToken(),
|
||||
});
|
||||
const branch = this.source.branch;
|
||||
if (
|
||||
branch.commit ==
|
||||
branches.filter((f) => f.name == branch.name)[0]?.commit
|
||||
) {
|
||||
const newCommit = branches.filter((f) => f.name == branch.name)[0]
|
||||
?.commit;
|
||||
if (branch.commit == newCommit) {
|
||||
console.log(`${this._model.repoId} is up to date`);
|
||||
return;
|
||||
}
|
||||
this._model.source.commit = branches.filter(
|
||||
(f) => f.name == branch.name
|
||||
)[0]?.commit;
|
||||
branch.commit = this._model.source.commit;
|
||||
this._model.source.commit = newCommit;
|
||||
branch.commit = newCommit;
|
||||
|
||||
if (!this._model.source.commit) {
|
||||
if (!newCommit) {
|
||||
console.error(
|
||||
`${branch.name} for ${this.source.githubRepository.fullName} is not found`
|
||||
);
|
||||
throw new AnonymousError("branch_not_found", this);
|
||||
}
|
||||
this._model.anonymizeDate = new Date();
|
||||
console.log(
|
||||
`${this._model.repoId} will be updated to ${this._model.source.commit}`
|
||||
);
|
||||
console.log(`${this._model.repoId} will be updated to ${newCommit}`);
|
||||
await this.resetSate("preparing");
|
||||
await this.anonymize();
|
||||
await downloadQueue.add(this, { jobId: this.repoId });
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -219,14 +234,18 @@ export default class Repository {
|
||||
* Expire the repository
|
||||
*/
|
||||
async expire() {
|
||||
return this.resetSate("expired");
|
||||
await this.updateStatus("expiring");
|
||||
await this.resetSate();
|
||||
await this.updateStatus("expired");
|
||||
}
|
||||
|
||||
/**
|
||||
* Remove the repository
|
||||
*/
|
||||
async remove() {
|
||||
return this.resetSate("removed");
|
||||
await this.updateStatus("removing");
|
||||
await this.resetSate();
|
||||
await this.updateStatus("removed");
|
||||
}
|
||||
|
||||
/**
|
||||
@@ -234,8 +253,10 @@ export default class Repository {
|
||||
*/
|
||||
async resetSate(status?: RepositoryStatus) {
|
||||
if (status) this._model.status = status;
|
||||
// remove attribute
|
||||
this._model.size = { storage: 0, file: 0 };
|
||||
this._model.originalFiles = null;
|
||||
// remove cache
|
||||
return Promise.all([
|
||||
this._model.save(),
|
||||
storage.rm(this._model.repoId + "/"),
|
||||
|
||||
50
src/queue.ts
Normal file
50
src/queue.ts
Normal file
@@ -0,0 +1,50 @@
|
||||
import * as Queue from "bull";
|
||||
import config from "../config";
|
||||
import { getRepository } from "./database/database";
|
||||
import Repository from "./Repository";
|
||||
|
||||
export const removeQueue = new Queue<Repository>("repository removal", {
|
||||
redis: {
|
||||
host: config.REDIS_HOSTNAME,
|
||||
port: config.REDIS_PORT,
|
||||
},
|
||||
});
|
||||
removeQueue.on("completed", async (job) => {
|
||||
await job.remove();
|
||||
});
|
||||
export const downloadQueue = new Queue<Repository>("repository download", {
|
||||
redis: {
|
||||
host: config.REDIS_HOSTNAME,
|
||||
port: config.REDIS_PORT,
|
||||
},
|
||||
});
|
||||
downloadQueue.on("completed", async (job) => {
|
||||
await job.remove();
|
||||
});
|
||||
|
||||
removeQueue.process(5, async (job) => {
|
||||
console.log(`${job.data.repoId} is going to be removed`);
|
||||
try {
|
||||
const repo = await getRepository(job.data.repoId);
|
||||
await repo.remove();
|
||||
} catch (error) {
|
||||
console.log("error", error);
|
||||
} finally {
|
||||
console.log(`${job.data.repoId} is removed`);
|
||||
}
|
||||
});
|
||||
|
||||
downloadQueue.process(2, async (job) => {
|
||||
console.log(`${job.data.repoId} is going to be downloaded`);
|
||||
try {
|
||||
const repo = await getRepository(job.data.repoId);
|
||||
job.progress("get_repo");
|
||||
await repo.remove();
|
||||
job.progress("get_remove");
|
||||
await repo.anonymize();
|
||||
} catch (error) {
|
||||
console.log("error", error);
|
||||
} finally {
|
||||
console.log(`${job.data.repoId} is downloaded`);
|
||||
}
|
||||
});
|
||||
@@ -12,6 +12,7 @@ import { IAnonymizedRepositoryDocument } from "../database/anonymizedRepositorie
|
||||
import Repository from "../Repository";
|
||||
import ConferenceModel from "../database/conference/conferences.model";
|
||||
import AnonymousError from "../AnonymousError";
|
||||
import { downloadQueue, removeQueue } from "../queue";
|
||||
|
||||
const router = express.Router();
|
||||
|
||||
@@ -65,12 +66,15 @@ router.post(
|
||||
const repo = await getRepo(req, res, { nocheck: true });
|
||||
if (!repo) return;
|
||||
|
||||
if (repo.status == "preparing" || repo.status == "removing") return;
|
||||
|
||||
const user = await getUser(req);
|
||||
if (repo.owner.id != user.id) {
|
||||
return res.status(401).json({ error: "not_authorized" });
|
||||
}
|
||||
await repo.anonymize();
|
||||
res.end("ok");
|
||||
await repo.updateStatus("preparing");
|
||||
await downloadQueue.add(repo, {jobId: repo.repoId});
|
||||
res.json({ status: repo.status });
|
||||
} catch (error) {
|
||||
handleError(error, res);
|
||||
}
|
||||
@@ -83,14 +87,16 @@ router.delete(
|
||||
async (req: express.Request, res: express.Response) => {
|
||||
const repo = await getRepo(req, res, { nocheck: true });
|
||||
if (!repo) return;
|
||||
// if (repo.status == "removing") return res.json({ status: repo.status });
|
||||
try {
|
||||
if (repo.status == "removed") throw new AnonymousError("is_removed");
|
||||
const user = await getUser(req);
|
||||
if (repo.owner.id != user.id) {
|
||||
return res.status(401).json({ error: "not_authorized" });
|
||||
}
|
||||
await repo.remove();
|
||||
console.log(`${req.params.repoId} is removed`);
|
||||
return res.json("ok");
|
||||
await repo.updateStatus("removing");
|
||||
await removeQueue.add(repo, {jobId: repo.repoId});
|
||||
return res.json({ status: repo.status });
|
||||
} catch (error) {
|
||||
handleError(error, res);
|
||||
}
|
||||
@@ -305,8 +311,8 @@ router.post(
|
||||
}
|
||||
repo.model.conference = repoUpdate.conference;
|
||||
await repo.updateStatus("preparing");
|
||||
res.send("ok");
|
||||
new Repository(repo.model).anonymize();
|
||||
res.json({ status: repo.status });
|
||||
await downloadQueue.add(repo, {jobId: repo.repoId});
|
||||
} catch (error) {
|
||||
return handleError(error, res);
|
||||
}
|
||||
@@ -369,11 +375,14 @@ router.post("/", async (req: express.Request, res: express.Response) => {
|
||||
}
|
||||
}
|
||||
|
||||
res.send("ok");
|
||||
new Repository(repo).anonymize();
|
||||
res.send({ status: repo.status });
|
||||
downloadQueue.add(new Repository(repo), {jobId: repo.repoId});
|
||||
} catch (error) {
|
||||
if (error.message?.indexOf(" duplicate key") > -1) {
|
||||
return handleError(new AnonymousError("repoId_already_used", repoUpdate.repoId), res);
|
||||
return handleError(
|
||||
new AnonymousError("repoId_already_used", repoUpdate.repoId),
|
||||
res
|
||||
);
|
||||
}
|
||||
return handleError(error, res);
|
||||
}
|
||||
|
||||
@@ -3,7 +3,6 @@ import * as express from "express";
|
||||
import * as stream from "stream";
|
||||
import config from "../../config";
|
||||
|
||||
|
||||
import { getRepo, handleError } from "./route-utils";
|
||||
|
||||
const router = express.Router();
|
||||
@@ -23,7 +22,7 @@ router.get(
|
||||
|
||||
// cache the file for 6 hours
|
||||
res.header("Cache-Control", "max-age=21600000");
|
||||
await pipeline(repo.zip(), res)
|
||||
await pipeline(repo.zip(), res);
|
||||
} catch (error) {
|
||||
handleError(error, res);
|
||||
}
|
||||
@@ -60,7 +59,6 @@ router.get(
|
||||
) {
|
||||
redirectURL = repo.source.url;
|
||||
} else {
|
||||
repo.check();
|
||||
await repo.updateIfNeeded();
|
||||
}
|
||||
|
||||
|
||||
@@ -115,7 +115,9 @@ export type RepositoryStatus =
|
||||
| "download"
|
||||
| "ready"
|
||||
| "expired"
|
||||
| "expiring"
|
||||
| "removed"
|
||||
| "removing"
|
||||
| "error";
|
||||
|
||||
export type ConferenceStatus = "ready" | "expired" | "removed";
|
||||
|
||||
Reference in New Issue
Block a user