Skip to content

Commit 9f58d3c

Browse files
authored
Merge pull request #4 from PreferredAI/fix-crawler
2 parents b101d10 + effa25c commit 9f58d3c

File tree

4 files changed

+24
-2
lines changed

4 files changed

+24
-2
lines changed

.github/workflows/nextjs.yml

Lines changed: 10 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -8,10 +8,20 @@ on:
88
# Runs on pushes targeting the default branch
99
push:
1010
branches: ["main"]
11+
paths-ignore:
12+
# If there are changes to these files, wait for the update-publications workflow to finish
13+
- "scripts/crawl-publications.ts"
14+
- ".github/workflows/update-publications.yml"
1115

1216
# Allows you to run this workflow manually from the Actions tab
1317
workflow_dispatch:
1418

19+
# Run after update-publications workflow
20+
workflow_run:
21+
workflows: ["Update Publications"]
22+
types:
23+
- completed
24+
1525
# Sets permissions of the GITHUB_TOKEN to allow deployment to GitHub Pages
1626
permissions:
1727
contents: read

.github/workflows/update-publications.yml

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -6,6 +6,11 @@ on:
66
schedule:
77
- cron: "0 0 * * 0"
88

9+
push:
10+
paths:
11+
- ".github/workflows/update-publications.yml"
12+
- "scripts/crawl-publications.ts"
13+
914
# Allow manual trigger
1015
workflow_dispatch:
1116

scripts/crawl-publications.ts

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -309,7 +309,7 @@ function parsePublicationFromLi(liContent: string): Publication | null {
309309
const isPaperHost = PAPER_HOST_DOMAINS.some(domain => url.includes(domain));
310310
const isTitle = isPaperHost &&
311311
text.length > MIN_TITLE_LINK_TEXT_LENGTH &&
312-
!text.toLowerCase().includes('code');
312+
(!text.toLowerCase().includes('code') || text.length > 30);
313313

314314
links.push({ text, url, isTitle });
315315
}

src/data/publications.ts

Lines changed: 8 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
// Auto-generated by crawl-publications.ts
2-
// Last updated: 2025-12-14T17:18:31.964Z
2+
// Last updated: 2025-12-16T17:41:08.912Z
33

44
export interface Publication {
55
title: string;
@@ -29,11 +29,13 @@ export const PUBLICATIONS_DATA: YearSection[] = [
2929
title: "Conv4Rec: A 1-by-1 Convolutional AutoEncoder for User Profiling through Joint Analysis of Implicit and Explicit Feedbacks",
3030
authors: "Antoine Ledent, Petr Kasalický, Rodrigo Alves, and Hady W. Lauw",
3131
venue: "IEEE Transactions on Neural Networks and Learning Systems (TNNLS), Vol. 36, No. 12, Dec 2025",
32+
pdfUrl: "https://arxiv.org/abs/2509.07499",
3233
},
3334
{
3435
title: "Parameter-Efficient Variational AutoEncoder for Multimodal Multi-Interest Recommendation",
3536
authors: "Nhu-Thuat Tran and Hady W. Lauw",
3637
venue: "ACM Multimedia Conference (ACM MM'25), Oct 2025",
38+
pdfUrl: "https://www.dropbox.com/scl/fi/q7g7ct173jxgqkuz5s4tb/acmmm25.pdf?rlkey=7dve8mod7trsjt6ubhgf02wm7&dl=0",
3739
},
3840
{
3941
title: "Optimal Transport Alignment of User Preferences from Ratings and Texts",
@@ -63,6 +65,7 @@ export const PUBLICATIONS_DATA: YearSection[] = [
6365
title: "VARIUM: Variational Autoencoder for Multi-Interest Representation with Inter-User Memory",
6466
authors: "Nhu-Thuat Tran and Hady W. Lauw",
6567
venue: "ACM International Conference on Web Search and Data Mining (WSDM'25), Mar 2025",
68+
pdfUrl: "https://www.dropbox.com/scl/fi/5nezl5hq0xhd0jrk6012n/wsdm25a.pdf?rlkey=bk8s3akrfzjv4ykse6thomzgd&dl=0",
6669
},
6770
{
6871
title: "Selecting Comparative Sets of Reviews Across Multiple Items",
@@ -193,6 +196,7 @@ export const PUBLICATIONS_DATA: YearSection[] = [
193196
title: "Multi-Representation Variational Autoencoder via Iterative Latent Attention and Implicit Differentiation",
194197
authors: "Nhu-Thuat Tran and Hady W. Lauw",
195198
venue: "ACM International Conference on Information and Knowledge Management (CIKM'23), Oct 2023",
199+
pdfUrl: "https://www.dropbox.com/scl/fi/eb30uta1e3vmn6gh1f8lu/cikm23.pdf?rlkey=ljfxqg8j9580wysvi70emu6d7&dl=0",
196200
},
197201
{
198202
title: "Robust Bidirectional Poly-Matching",
@@ -384,6 +388,7 @@ export const PUBLICATIONS_DATA: YearSection[] = [
384388
title: "Bilateral Variational Autoencoder for Collaborative Filtering",
385389
authors: "Quoc-Tuan Truong, Aghiles Salah, and Hady W. Lauw",
386390
venue: "ACM International Conference on Web Search and Data Mining (WSDM'21), Mar 2021",
391+
pdfUrl: "https://www.dropbox.com/s/8id1sf17cimp6j5/wsdm21b.pdf?dl=0",
387392
},
388393
{
389394
title: "Explainable Recommendation with Comparative Constraints on Product Aspects",
@@ -428,6 +433,7 @@ export const PUBLICATIONS_DATA: YearSection[] = [
428433
title: "Topic Modeling on Document Networks with Adjacent-Encoder",
429434
authors: "Ce Zhang and Hady W. Lauw",
430435
venue: "AAAI Conference on Artificial Intelligence (AAAI'20), Feb 2020.",
436+
pdfUrl: "https://www.dropbox.com/s/eqkyfviowwwleey/aaai20a.pdf?dl=0",
431437
extraLinks: [{"text":"Code","url":"https://github.com/PreferredAI/adjacent-encoder"}],
432438
},
433439
],
@@ -521,6 +527,7 @@ export const PUBLICATIONS_DATA: YearSection[] = [
521527
title: "Collaborative Topic Regression with Denoising AutoEncoder for Content and Community Co-Representation",
522528
authors: "Trong T. Nguyen and Hady W. Lauw",
523529
venue: "ACM Conference on Information and Knowledge Management (CIKM'17), short paper, Nov 2017",
530+
pdfUrl: "https://www.dropbox.com/s/bq5q9lxn9igiyvp/cikm17b.pdf?dl=0",
524531
},
525532
{
526533
title: "SemVis: Semantic Visualization for Interactive Topical Analysis",

0 commit comments

Comments
 (0)