Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 4 additions & 0 deletions src/config.ts
Original file line number Diff line number Diff line change
Expand Up @@ -39,6 +39,10 @@ let config = {
appPrivateKeyPath: '',
appId: 0,
},
gitlab: {
token: '',
apiUrl: '',
},
google: {
map: {
key: '',
Expand Down
171 changes: 171 additions & 0 deletions src/cron/tasks/updateGitlabRepos.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,171 @@
import { Task } from '..';
import getConfig from '../../config';
import { insertRecords, query } from '../../db/clickhouse';
import { formatDate, getLogger } from '../../utils';
import { get } from 'https';

/**
 * Cron task that incrementally syncs basic GitLab project info into the
 * ClickHouse table `gitlab_repo_list`.
 *
 * Scheduled with the cron expression `0 10 * * *` (minute 0 of hour 10, every
 * day, in whatever time zone the scheduler uses).
 *
 * Each run:
 *  1. makes sure the target table exists;
 *  2. reads the newest `last_activity_at` already stored and uses it as the
 *     starting cursor;
 *  3. pages through `${apiUrl}/projects` ordered by `last_activity_at`
 *     ascending, saving every page and moving the cursor to the last project
 *     of that page;
 *  4. stops on an empty page, on a cursor that no longer advances, or on the
 *     first error (which is logged).
 *
 * The task is a no-op (with an error log) when the GitLab token or API URL is
 * missing from the configuration.
 */
const task: Task = {
  cron: '0 10 * * *',
  // NOTE(review): presumably prevents overlapping runs of this task — confirm against the cron runner.
  singleInstance: true,
  callback: async () => {
    const logger = getLogger('UpdateGitlabRepoTask');
    const config = await getConfig();
    const gitlabToken = config.gitlab.token;
    const gitlabApiUrl = config.gitlab.apiUrl;

    // A falsy check already covers '', undefined and null.
    if (!gitlabToken || !gitlabApiUrl) {
      logger.error('GitLab token or API URL is not set');
      return;
    }

    const tableName = 'gitlab_repo_list';
    const pageSize = 100;

    /** Creates the target table on first run; a no-op afterwards. */
    const createGitlabRepoListTable = async (): Promise<void> => {
      // ReplacingMergeTree(inserted_at): for rows sharing the same `id`, the
      // row with the greatest `inserted_at` wins when parts are merged.
      const createTableQuery = `
CREATE TABLE IF NOT EXISTS ${tableName} (
id UInt64,
namespace_id UInt64,
namespace_name String,
name String,
description String,
default_branch String,
archived UInt8,
topics Array(String),
tag_list Array(String),
created_at DateTime,
stars_count UInt32,
forks_count UInt32,
last_activity_at DateTime,
updated_at DateTime,
inserted_at UInt64
)
ENGINE = ReplacingMergeTree(inserted_at)
ORDER BY id
SETTINGS index_granularity = 8192
`;
      await query(createTableQuery);
    };
    await createGitlabRepoListTable();

    /**
     * Converts a raw API project into a table row.
     * Missing/null text and list fields are replaced with empty values so the
     * row always matches the non-nullable column types.
     */
    const parseProject = (project: ProjectRaw): ProjectItem => {
      return {
        id: project.id,
        namespace_id: project.namespace.id,
        namespace_name: project.namespace.full_path,
        name: project.path_with_namespace,
        description: project.description ?? '',
        default_branch: project.default_branch ?? '',
        archived: project.archived ? 1 : 0,
        topics: project.topics ?? [],
        tag_list: project.tag_list ?? [],
        created_at: formatDate(project.created_at),
        stars_count: project.stars_count,
        forks_count: project.forks_count,
        last_activity_at: formatDate(project.last_activity_at),
        updated_at: formatDate(project.updated_at),
        inserted_at: 0, // will be set when saving
      };
    };

    /**
     * Fetches one page of projects whose last activity is after the cursor,
     * ordered by `last_activity_at` ascending.
     *
     * @param lastActivityAfter cursor passed as `last_activity_after`
     * @param limit page size passed as `per_page`
     * @returns the parsed JSON array of projects
     * @throws on network errors, non-2xx responses, invalid JSON, or a JSON
     *         payload that is not an array
     */
    const getProjects = (lastActivityAfter: string, limit: number): Promise<ProjectRaw[]> => {
      return new Promise<ProjectRaw[]>((resolve, reject) => {
        const params = new URLSearchParams({
          last_activity_after: lastActivityAfter,
          per_page: limit.toString(),
          sort: 'asc',
          order_by: 'last_activity_at',
        });
        const url = new URL(`${gitlabApiUrl}/projects?${params.toString()}`);
        const options = {
          hostname: url.hostname,
          // Keep an explicit port from the configured URL instead of silently dropping it.
          ...(url.port ? { port: Number(url.port) } : {}),
          path: url.pathname + url.search,
          headers: {
            'Authorization': `Bearer ${gitlabToken}`,
            'User-Agent': 'opendigger-bot',
          },
        };
        get(options, (res) => {
          let data = '';
          // Decode as UTF-8 at the stream level so multi-byte characters that
          // straddle chunk boundaries are not corrupted by string concatenation.
          res.setEncoding('utf8');
          res.on('data', (chunk) => data += chunk);
          res.on('error', reject);
          res.on('end', () => {
            const status = res.statusCode ?? 0;
            if (status < 200 || status >= 300) {
              reject(new Error(`GitLab API responded with status ${status}: ${data}`));
              return;
            }
            try {
              const parsed: unknown = JSON.parse(data);
              if (!Array.isArray(parsed)) {
                reject(new Error(`Unexpected GitLab API response, expected an array: ${data}`));
                return;
              }
              resolve(parsed as ProjectRaw[]);
            } catch (e) {
              logger.error(`Error parsing projects: ${data}`);
              reject(e);
            }
          });
        }).on('error', reject);
      });
    };

    /** Inserts the rows, stamping all of them with the current time as `inserted_at`. */
    const saveProjects = async (projects: ProjectItem[]): Promise<void> => {
      const insertedAt = Date.now();
      await insertRecords(projects.map(project => ({
        ...project,
        inserted_at: insertedAt,
      })), tableName);
    };

    // NOTE(review): assumes the query result is row-major and that the value
    // is parseable by `new Date` — confirm against the clickhouse helper.
    const maxLastActivityAt = await query<any[]>(`SELECT MAX(last_activity_at) AS max_last_activity_at FROM ${tableName}`);
    let lastActivityAt = new Date(maxLastActivityAt[0][0]).toISOString();
    logger.info(`Max last activity at in database: ${lastActivityAt}`);
    let totalCount = 0;
    for (;;) {
      try {
        const projects = await getProjects(lastActivityAt, pageSize);
        if (projects.length === 0) {
          // Normal termination: nothing newer than the cursor.
          break;
        }
        await saveProjects(projects.map(parseProject));
        totalCount += projects.length;
        const nextCursor = projects[projects.length - 1].last_activity_at;
        logger.info(`Saved ${projects.length} projects, starting from ${nextCursor}, total count: ${totalCount}`);
        // Guard against an endless loop: if the API keeps returning a page
        // that ends on the same instant as the cursor, no progress is possible.
        if (new Date(nextCursor).getTime() === new Date(lastActivityAt).getTime()) {
          logger.info(`Cursor did not advance past ${lastActivityAt}, stopping`);
          break;
        }
        lastActivityAt = nextCursor;
      } catch (error: unknown) {
        const detail = error instanceof Error ? `${error.message}\n${error.stack}` : String(error);
        logger.error(`Error getting projects starting from ${lastActivityAt}: ${detail}`);
        break;
      }
    }
    logger.info(`Task done, total count: ${totalCount}`);
  }
};

/**
 * The subset of a GitLab project object (one element of the `/projects`
 * response array) that this task reads.
 *
 * `description` and `default_branch` are typed as nullable because the
 * consumer already falls back to `''` for them; presumably the API sends
 * `null` when a project has no description or no branch yet.
 */
interface ProjectRaw {
  id: number;
  /** May be `null`; stored as an empty string. */
  description: string | null;
  /** Full project path including its namespace; stored as the row's `name`. */
  path_with_namespace: string;
  created_at: string;
  /** May be `null`; stored as an empty string. */
  default_branch: string | null;
  tag_list: string[];
  topics: string[];
  archived: boolean;
  forks_count: number;
  stars_count: number;
  /** Used both as a stored column and as the pagination cursor. */
  last_activity_at: string;
  updated_at: string;
  namespace: {
    id: number;
    full_path: string;
  };
}

/**
 * One row of the `gitlab_repo_list` table, as produced from a `ProjectRaw`
 * and handed to `insertRecords`.
 */
interface ProjectItem {
  // --- identity ---
  id: number;
  name: string;
  namespace_id: number;
  namespace_name: string;

  // --- descriptive metadata ---
  description: string;
  default_branch: string;
  topics: string[];
  tag_list: string[];
  /** 1 when the project is archived, 0 otherwise. */
  archived: number;

  // --- counters ---
  stars_count: number;
  forks_count: number;

  // --- timestamps (strings produced by `formatDate`) ---
  created_at: string;
  updated_at: string;
  last_activity_at: string;

  /** Epoch milliseconds set at save time; 0 until then. */
  inserted_at: number;
}

// Expose the task object as this module's CommonJS export value.
// NOTE(review): presumably the cron runner loads task files via `require` — confirm before converting to an ES export.
module.exports = task;